# Model architecture settings.
# NOTE(review): the `_target_` key looks like a Hydra-style instantiate target,
# in which case the sibling keys would be passed to that class as keyword
# arguments — confirm against the code that loads this file.
architecture:
  # Dotted import path of the model class.
  _target_: krt.models.np.attn_cnp.AttnCNP
  # Presumably the hidden feature width shared by the sub-networks — TODO confirm.
  dim_hid: 128
  # Depth settings for the encoder sub-networks; the names suggest value,
  # query/key, pre- and post-attention stacks — verify against AttnCNP.
  enc_v_depth: 4
  enc_qk_depth: 2
  enc_pre_depth: 4
  enc_post_depth: 2
  # Presumably the decoder depth — TODO confirm.
  dec_depth: 3
# Optimisation settings.
# NOTE(review): the consumer of this section is not visible in this file;
# confirm which keys the training script actually reads.
training:
  # Written with an explicit mantissa dot: YAML 1.1 loaders (e.g. PyYAML)
  # resolve a bare `5e-4` as the string "5e-4" rather than a float, while
  # `5.0e-4` is a float under both YAML 1.1 and 1.2 resolvers.
  learning_rate: 5.0e-4
  # 0.0 — presumably disables weight decay; verify against the optimiser setup.
  weight_decay: 0.0
  # Canonical lowercase boolean (same value as `True`, but lint-clean and
  # unambiguous across YAML versions).
  # NOTE(review): presumably toggles a learning-rate schedule — confirm.
  lr_schedule: true
