---
# Top-level training settings.
# The descriptions below are inferred from key names only; confirm each one
# against the code that loads this file.

# Presumably the random seed for the run. `control.set_seed` further down in
# this file holds a different value (1); how the two relate is not visible here.
seed: 42

# Optimisation settings.
# NOTE(review): BATCH_SIZE is the only upper-case key in this file. It is left
# as-is because the consumer presumably looks it up by this exact spelling.
BATCH_SIZE: 64
learning_rate: 0.001
momentum: 0.9

# Epoch counts. `epochs_t0` / `epochs_t1` presumably refer to the two tasks or
# the two teachers defined later in this file -- TODO confirm which.
epochs_teacher: 5
epochs_t0: 3
epochs_t1: 3

# Dataset identifier, kept as a quoted string.
dataset: 'MNIST'

# Boolean flag; presumably controls the head sizes of the student model --
# confirm against the student model implementation.
student_equal_heads: true

# "Full" model: model name plus its settings.
# NOTE(review): `full_kwargs` is a top-level key (a sibling of `full_model`),
# not a child of it. Presumably the loader pairs the two by their shared
# prefix and passes the kwargs to the model constructor -- confirm.
full_model:
  name: 'LinearModel'
full_kwargs:
  # 784 = 28 * 28; presumably the flattened MNIST image size -- TODO confirm.
  input_size: 784
  # Equals the total number of labels in task0_labels + task1_labels (5 + 5).
  output_size: 10

# Teacher 0: model name plus its settings.
# NOTE(review): `teacher0_kwargs` is a top-level sibling of `teacher0_model`,
# not nested under it; presumably paired by prefix in the loader -- confirm.
teacher0_model:
  name: 'LinearModel'
teacher0_kwargs:
  # 784 = 28 * 28; presumably the flattened MNIST image size -- TODO confirm.
  input_size: 784
  # Set to 10 even though task0_labels lists only five labels; whether this
  # teacher is trained on task 0 alone is not visible here -- verify.
  output_size: 10

# Teacher 1: model name plus its settings.
# NOTE(review): `teacher1_kwargs` is a top-level sibling of `teacher1_model`,
# not nested under it; presumably paired by prefix in the loader -- confirm.
teacher1_model:
  name: 'LinearModel'
teacher1_kwargs:
  # 784 = 28 * 28; presumably the flattened MNIST image size -- TODO confirm.
  input_size: 784
  # Set to 10 even though task1_labels lists only five labels; whether this
  # teacher is trained on task 1 alone is not visible here -- verify.
  output_size: 10

# Student: the only entry in this file that uses 'DualHeadLinearModel'
# rather than 'LinearModel'.
# NOTE(review): `student_kwargs` is a top-level sibling of `student_model`,
# not nested under it; presumably paired by prefix in the loader -- confirm.
student_model:
  name: 'DualHeadLinearModel'
student_kwargs:
  # 784 = 28 * 28; presumably the flattened MNIST image size -- TODO confirm.
  input_size: 784
  # NOTE(review): whether this is the size of each head or the total across
  # both heads cannot be determined from this file; see also the top-level
  # `student_equal_heads` flag.
  output_size: 10

# Label sets for the two tasks. Together the two lists cover the integers
# 0-9 exactly once: 0-4 for task 0 and 5-9 for task 1.
task0_labels:
  - 0
  - 1
  - 2
  - 3
  - 4
task1_labels:
  - 5
  - 6
  - 7
  - 8
  - 9

# NOTE(review): the purpose of this section is not evident from the file
# itself; presumably settings for a control/baseline run -- confirm.
control:
  # The only `hidden_size` in this file; the model kwargs sections above
  # define only input_size and output_size.
  hidden_size: 10
  # Integer 1, not a YAML boolean. Differs from the top-level `seed: 42`;
  # whether this is a seed value or an on/off flag is unclear -- verify
  # against the consumer.
  set_seed: 1
