# @package _global_
model:
  # Dotted import path of the model class (Hydra-style `_target_` key).
  _target_: masked_autoencoding.src.models.vitca_deq.ViTCA

  # --- Attention locality ---
  # When true, transformer attention is restricted to a neighbourhood
  # surrounding each cell; the neighbourhood extent is given below.
  localize_attn: true
  localized_attn_neighbourhood: [3, 3]

  # --- Patching and positional encoding ---
  # Spatial patch size that each cell overlaps.
  patch_size: 1
  overlapping_patches: false
  # Type of positional encoding/embedding used by the transformer.
  # One of: vit_handcrafted, nerf_handcrafted, learned,
  # or null for no positional encoding.
  pe_method: vit_handcrafted
  # Choices: raw_xy, sin_cos, sin_cos_xy, sinc
  nerf_pe_basis: raw_xy
  # Max frequency of the positional encoding, measured as 2^L-1 where L is
  # this value. L = 5 -> 32x32.
  nerf_pe_max_freq: 5

  octaves: 0

  # --- Transformer and cell dimensions ---
  depth: 1
  heads: 4
  mlp_dim: 64
  dropout: 0.0
  # Cell initialisation mode: constant or random.
  cell_init: constant
  cell_in_chns: 3
  cell_out_chns: 3
  cell_hidden_chns: 32
  embed_cells: true
  embed_dim: 128
  embed_dropout: 0.0

  # --- Solver settings ---
  # NOTE(review): judging by the `vitca_deq` module name these look like
  # fixed-point (DEQ) forward/backward solver options - confirm against ViTCA.
  f_solver: anderson
  f_thresh: 60
  b_solver: broyden
  b_thresh: 36
  stop_mode: abs
  eval_factor: 1.5
  ift: true
  safe_ift: false
  indexing: []
  sup_all: true
  phantom_grad: [1]
  tau: 1.0