# Defaults list: selects the `chess_default` option for `hyp` and the
# `dt_net_recall_2d` option for `model`.
# NOTE(review): this looks like a Hydra defaults list, where entry order can
# affect how configs are composed — keep the order unless a change is intended.
defaults:
  - hyp: chess_default
  - model: dt_net_recall_2d

# Identifier of this configuration.
name: chess
# Written without `_` digit separators (700,000 and 600,000): underscores in
# integers are a YAML 1.1 feature and YAML 1.2 parsers read them as strings.
# NOTE(review): whether these are sample counts or split indices is decided
# by the consumer of this config — confirm before changing them.
test_data: 700000
train_data: 600000

# Model settings given directly in this file.
# NOTE(review): presumably overrides the width provided by the `model` entry
# of the defaults list — confirm against the composition order in use.
model:
  width: 512

# Settings grouped under `deq`.
# NOTE(review): key meanings below are inferred from their names; confirm
# against the code that consumes this section.
deq:
  # Solver name and threshold for the `f_` and `b_` passes
  # (presumably forward / backward — confirm).
  f_solver: 'anderson'
  b_solver: 'anderson'
  f_thres: 40
  b_thres: 40
  stop_mode: 'rel'
  num_layers: 30
  in_channels: 12
  num_blocks: 2
  wnorm: true
  norm: 'group'
  fp_init: 'zeros'
  # Number of groups if using group norm; will be ignored for other norms.
  num_groups: 4
  extra:
    block: BASIC
  solver:
    # Mantissa dot and signed exponent are required for YAML 1.1 loaders
    # (e.g. stock PyYAML) to resolve this as a float instead of a string.
    lam: 1.0e-4
    m: 5
  loss:
    jac_loss: false
    jac_loss_weight: 0.1
    jac_loss_freq: 0.02
    pretrain_jac_loss_weight: 0.0
    jac_stop_epoch: 80
    # Equal to 1e8; spelled so that every loader types it as a float.
    jac_loss_incremental: 1.0e+8
    layer_loss: false
    phantom_grad: false
    pg_tau: 0.5
    pg_iters: 3
    # NOTE(review): `layer_idx` and `gamma` both have three entries;
    # presumably gamma[i] pairs with layer_idx[i] — confirm.
    layer_idx:
      - 10
      - 20
      - 30
    gamma:
      - 0.01
      - 0.025
      - 0.05

# Training settings.
# NOTE(review): presumably the number of steps run in a pre-training phase
# before regular training — confirm against the training loop.
train:
  pretrain_steps: 20