# Model hyperparameters. `_target_` holds a dotted class path, which looks like
# a Hydra-style instantiation target; the sibling keys are presumably passed to
# that class as constructor arguments — confirm against the AttnLNP signature.
architecture:
  _target_: krt.models.np.attn_lnp.AttnLNP
  # Feature widths — presumably hidden and latent dimensions (verify in model).
  dim_hid: 128
  dim_lat: 128
  # Layer counts for the encoder/decoder parts. What each suffix (v, qk, pre,
  # post) refers to is defined by the model class and is not visible here.
  enc_v_depth: 4
  enc_qk_depth: 2
  enc_pre_depth: 4
  enc_post_depth: 2
  dec_depth: 3
  # Sample counts; the names suggest training vs. evaluation — TODO confirm.
  tr_num_samples: 4
  eval_num_samples: 50
# Training hyperparameters (how each key is consumed is defined by the training
# code, which is not part of this file).
training:
  # Written with an explicit decimal point on purpose: YAML 1.1 loaders such as
  # PyYAML only resolve scientific notation as a float when the mantissa
  # contains a ".", so a bare `5e-4` would be loaded as the string "5e-4".
  learning_rate: 5.0e-4
  weight_decay: 0.0
  # Canonical lowercase boolean; parses identically under YAML 1.1 and 1.2.
  lr_schedule: true
