
# Dataset name and the two label subsets, one list per task.
# Each label is an int in [0, 9].
dataset: "MNIST"
task0_labels: [0, 1, 2, 3, 4]  # type: List[int]
task1_labels: [5, 6, 7, 8, 9]  # type: List[int]

# "Full" model: model name plus its keyword settings.
# NOTE(review): presumably full_kwargs is passed to the class named by
# full_model - confirm against the code that loads this file.
full_model: "SimpleMLP"
full_kwargs:
  input_size: 784  # 28*28 = 784 (MNIST)
  # ${control.*} values are interpolations of keys under the top-level
  # `control` mapping.
  hidden_size: ${control.hidden_size}
  num_classes: 10
  activation: ${control.activation}

# Teacher 0: model name plus its keyword settings.
# num_classes is 5, the same as the number of entries in task0_labels.
teacher0_model: "SimpleMLP"
teacher0_kwargs:
  input_size: 784  # 28*28 = 784 (MNIST)
  # ${control.*} values are interpolations of keys under the top-level
  # `control` mapping.
  hidden_size: ${control.hidden_size}
  num_classes: 5
  activation: ${control.activation}

# Teacher 1: model name plus its keyword settings.
# num_classes is 5, the same as the number of entries in task1_labels.
teacher1_model: "SimpleMLP"
teacher1_kwargs:
  input_size: 784  # 28*28 = 784 (MNIST)
  # ${control.*} values are interpolations of keys under the top-level
  # `control` mapping.
  hidden_size: ${control.hidden_size}
  num_classes: 5
  activation: ${control.activation}

# Student: model name plus its keyword settings.
# num_classes_per_head is 5, the same as the length of each task label list.
student_model: "DoubleHeadMLP"
student_kwargs:
  input_size: 784  # 28*28 = 784 (MNIST)
  # ${control.*} values are interpolations of keys under the top-level
  # `control` mapping.
  hidden_size: ${control.hidden_size}
  num_classes_per_head: 5
  activation: ${control.activation}

# Initialisation / head options; each one mirrors a key under `control`.
init_method: ${control.init_method}
first_layer_bias: ${control.first_layer_bias}
# Note the differing names: this key reads control.same_head.
student_equal_heads: ${control.same_head}

# Training settings. Epoch counts and batch size must be positive ints.
epochs_teacher: 50  # type: int > 0
epochs_t0: 50  # type: int > 0
epochs_t1: 50  # type: int > 0
# Key is upper-case, unlike its neighbours; left as-is because the
# consumer looks it up by this exact name.
BATCH_SIZE: 64  # type: int > 0
seed: ${control.set_seed}  # type: int, taken from control.set_seed
learning_rate: 0.01  # type: float
momentum: 0.0  # type: float
detect_anomaly_flag: false  # type: bool


# Central knobs. Other keys in this file pull these values in through
# ${control.<name>} interpolation.
control:
  hidden_size: 10  # type: int
  # hidden_size_2, tasks_key and alpha are not referenced by any
  # interpolation in the visible part of this file.
  hidden_size_2: 10  # type: int
  set_seed: 1  # type: int; read by the top-level `seed`
  tasks_key: null  # type: str
  # NOTE(review): annotated as float but written as the integer 0 -
  # confirm the consumer accepts an int here.
  alpha: 0  # type: float
  same_head: false  # type: bool; read by `student_equal_heads`
  init_method: "kaiming"  # type: str
  activation: "relu"  # type: str
  first_layer_bias: null  # type: bool or null
