

dataset:
  name: cifar100
  input_shape: [3,32,32]
  image_size: 32
  output_sizes: 1000
  data_dir: ...


network:
  _target_: src.networks.resnet.MultiTaskCNN
  input_shape:  [3,78,64]
  use_classifier: true
  trainable_weights: false
  task_groups: none
  num_possible_conv: 2
  image_size: ${dataset.image_size}
  dec_normal_bias_init: 0
  conv_normal_bias_init: 0
  dec_activation: nn.ReLU
  conv_activation: nn.ReLU
  coarse_labels: false
  pretrained: true
  number_of_resnet_to_cut: 1
  use_possible_bias: true
  use_dec_bias: true
  use_residual_connection: true


seed: 1
do_comodulation: false
do_attention: false
train_test_from_scratch: true

dataset_name: ${dataset.name}
n_train_test: 5
load_pretrained_weights: false
task_number: 40
copy_files_to_save: false
files_to_save: []

plot_gradients: false
plot_informative_neurons: false

do_only_output_weights: true

make_embeddings_plot: false
plot_pca_lda: true
plot_corruptions: false
plot_model_calibration: true
plot_adversarial: false
pretrain_coarse_labels: true
save_gains: true


pretrain_config:
  add_augmentations: true
  adversarial_training: false
  adversarial_eps: 0.05
  batch_size: 64
  max_epoch: 1
  lr:  0.0002
  image_size: ${network.image_size}
  do_l1_loss_on_controller: false
  l1_loss_weight: 0.000001
  eval_every_batch: false
  eval_every_n_batch: 1
  max_batch: -1
  log_freq: 200
  dataset_name: ${dataset.name}
  coarse_labels: ${pretrain_coarse_labels}
  fine_tasks: false
  plot_corruptions: false
  plot_adversarial: false
  data_dir: ${dataset.data_dir}

attention_config:
  add_augmentations: false
  adversarial_training: false
  adversarial_eps: 0.1
  do_l1_loss_on_controller: false  
  l1_loss_weight: 0.1
  batch_size: 64
  max_epoch: 10
  lr:  0.0005
  classifier_lr: 0.0005
  image_size: ${network.image_size}
  eval_every_batch: false
  eval_every_n_batch: 1
  max_batch: 100
  log_freq: 200
  retrain_everything: false
  dataset_name: ${dataset.name}
  coarse_labels: false
  plot_corruptions: ${plot_corruptions}
  plot_adversarial: ${plot_adversarial}
  data_dir: ${dataset.data_dir}
  
comodulation_config:
  add_augmentations: false
  adversarial_training: false
  adversarial_eps: 0.1
  do_l1_loss_on_controller: false  
  l1_loss_weight: 0.1
  batch_size: 64
  max_epoch: 10
  lr:  0.0005
  classifier_lr: 0.0005
  image_size: ${network.image_size}
  eval_every_batch: false
  eval_every_n_batch: 1
  max_batch: 100
  log_freq: 200
  retrain_everything: false
  dataset_name: ${dataset.name}
  coarse_labels: false
  plot_corruptions: ${plot_corruptions}
  plot_adversarial: ${plot_adversarial}
  data_dir: ${dataset.data_dir}

modulation_params:
  steps: 25
  num_tasks: ${task_number}
  retrain_last_layer: true
  retrain_everything:  false
  use_modulations_in_gain: true
  modulation_noise_mean: 0
  modulation_noise_std: 0.4
  comod_backprop: false
  normalize_gain_minmax_after: true
  only_train_added_params: false
  only_retrain_last: false
  compute_gain_once_with_train_set: false

controller:
  hidden_dim: 256
  num_layers: 2
  guided_init: false
  use_end_bias: true
  params_per_group: true
  do_act_end: false
  act_end: nn.Identity

hydra:
  run:
    dir: outputs/multitask/${dataset.name}/${now:%m.%d}/${now:%H%M%S%f}/

