# @package _global_

# Top-level settings; the `@package _global_` header on the first line of this
# file places them at the root of the composed config.
# NOTE(review): how `debug` and `device` are consumed is not visible in this
# file -- presumably read by the training entry point; confirm there.
debug: false
device: "cuda"

# Hydra multirun sweep. Every entry under `params` is handed to the sweeper as
# a `key=value` override string; comma-separated values and glob(...) expand
# into one job per combination, while single values are applied to every job.
hydra:
  mode: MULTIRUN
  sweeper:
    params:
      # Config-group selections; the leading "+" adds them to the defaults.
      +model: ktst
      +data: mirt
      # Swept: one job per option matched by the glob in each config group.
      +reproduce/ktst/synthetic/mirt_aggregations: glob([*])
      +reproduce/ktst/synthetic/mirt_data: glob([*])
      # Swept: six train/val set sizes.
      data.num_students_train_val: 500,1000,2000,3000,4000,5000
      data.student_offset: -1.96
      data.batch_size: 100
      data.batch_size_val_and_test: 200
      # Swept: five seeds.
      data.seed: 0,1,2,3,4
      data.num_students_test: 1000
      data.num_questions: 1000
      data.num_responses_per_student: 40
      data.num_concepts: 10
      data.guessing_prob: 0.25
      # Model settings, fixed across all jobs.
      model.d_model: 128
      model.nhead_tf: 4
      model.nhead_agg: 4
      model.num_layers_tf_enc: 4
      model.num_layers_tf_dec: 4
      model.num_layers_agg: 2
      model.dim_feedforward: 256
      model.dropout: 0.0
      model.dim_classifier: 256
      model.use_bias_emb: true
      # The leading "+" adds `theta_lr` as a new key under `optimizer`.
      +optimizer.theta_lr: 0.005
      model.attn_variant: learnable_alibi_monotonic_q_k
      # Sweeper params are string-valued overrides, so the list is written in
      # Hydra's override syntax rather than as a nested YAML sequence. Commas
      # inside the brackets form a single list value, not a sweep. The quotes
      # stop YAML from parsing the brackets as a flow sequence.
      trainer.eval_modes: "[val,test]"
      trainer.num_epochs: 200
