# General experiment settings.
# NOTE(review): these keys are interpreted by an experiment runner that is not
# part of this file; hedged notes below are inferred from key names — confirm.
trials: 5
results_dir: results/mnist_add
dataset: mnist_add
num_workers: 8
batch_size: 2048
num_operands: 12
# 12 entries, matching `num_operands: 12`: four lists of 0-2, four of 0-4 and
# four of 0-9.
# NOTE(review): presumably entry i restricts the digits used for operand i —
# confirm against the dataset loader.
selected_digits:
    - [0, 1, 2]
    - [0, 1, 2]
    - [0, 1, 2]
    - [0, 1, 2]
    - [0, 1, 2, 3, 4]
    - [0, 1, 2, 3, 4]
    - [0, 1, 2, 3, 4]
    - [0, 1, 2, 3, 4]
    - [0, 1, 2, 3, 4, 5, 6, 7, 8, 9]
    - [0, 1, 2, 3, 4, 5, 6, 7, 8, 9]
    - [0, 1, 2, 3, 4, 5, 6, 7, 8, 9]
    - [0, 1, 2, 3, 4, 5, 6, 7, 8, 9]
# NOTE(review): 30 is half of 60, the largest sum reachable from the digits in
# `selected_digits` (4*2 + 4*4 + 4*9); presumably the task label is the operand
# sum binarised at this value — confirm.
threshold_labels: 30
noise_level: 0.0
max_epochs: 500
train_dataset_size: 10000
sampling_percent: 1
# Booleans are written in canonical lowercase form (`true`/`false`).
sampling_groups: true
skip_repr_evaluation: true
# NOTE(review): presumably hidden-layer widths of the concept-to-label model —
# confirm.
c2y_layers: [128, 128]

# Intervention parameters
intervention_freq: 1
intervention_batch_size: 2048
# Names of the intervention policies listed for this experiment.
# NOTE(review): the names are resolved by the experiment runner (not visible
# here); the first entry is intentionally left commented out.
intervention_policies:
    # - 'intcem_policy'
    - 'group_random'
    - 'group_random_no_prior'
    - 'group_coop_no_prior'
    - 'behavioural_cloning_no_prior'
    - 'group_uncertainty_no_prior'
    - 'optimal_greedy_no_prior'
    - 'global_val_error_no_prior'
    - 'global_val_improvement_no_prior'

# Dataset variables
root_dir: data/mnist/
test_subsampling: 1
# Booleans are written in canonical lowercase form (`true`/`false`).
weight_loss: true
use_task_class_weights: true
check_val_every_n_epoch: 2

# Parameters common to the entries under `runs`.
# NOTE(review): presumably a run's own keys take precedence over these values
# (e.g. the first run sets `concept_loss_weight: 5` against 10 here) — confirm
# against the config loader.
shared_params:
    top_k_accuracy: null
    save_model: true
    patience: 5
    emb_size: 16
    extra_dims: 0
    concept_loss_weight: 10
    learning_rate: 0.001
    weight_decay: 0.000004
    c_extractor_arch: resnet18
    optimizer: sgd
    # `bool` is an ordinary string key here, not a YAML type tag.
    bool: false
    early_stopping_monitor: val_loss
    early_stopping_mode: min
    early_stopping_delta: 0.0
    momentum: 0.9
    sigmoidal_prob: false
    training_intervention_prob: 0.25
# One entry per model configuration to run.
runs:
    # ConceptBottleneckModel tagged "Sigmoid": sets `sigmoidal_prob: true` and
    # `concept_loss_weight: 5` (`shared_params` has false and 10 respectively).
    - architecture: 'ConceptBottleneckModel'
      extra_name: "Sigmoid"
      sigmoidal_embedding: false
      training_intervention_prob: 0.25
      concept_loss_weight: 5
      concat_prob: false
      embedding_activation: "leakyrelu"
      bool: false
      extra_dims: 0
      sigmoidal_extra_capacity: false
      sigmoidal_prob: true


    # ConceptBottleneckModel tagged "Logit": keeps `sigmoidal_prob: false` and
    # does not set `concept_loss_weight` or `training_intervention_prob` itself.
    # NOTE(review): presumably those two fall back to `shared_params` — confirm.
    - architecture: 'ConceptBottleneckModel'
      extra_name: "Logit"
      sigmoidal_embedding: false
      concat_prob: false
      embedding_activation: "leakyrelu"
      bool: false
      extra_dims: 0
      sigmoidal_extra_capacity: false
      sigmoidal_prob: false

    # SequentialConceptBottleneckModel run; sets its own `c2y_max_epochs: 200`
    # in addition to the top-level `max_epochs: 500`.
    # NOTE(review): presumably `c2y_max_epochs` caps a separate concept-to-label
    # training stage — confirm.
    - architecture: 'SequentialConceptBottleneckModel'
      extra_name: ""
      sigmoidal_embedding: false
      concat_prob: false
      embedding_activation: "leakyrelu"
      bool: false
      extra_dims: 0
      sigmoidal_extra_capacity: false
      sigmoidal_prob: true
      c2y_max_epochs: 200

    # IndependentConceptBottleneckModel run; same keys and values as the
    # SequentialConceptBottleneckModel entry apart from `architecture`.
    - architecture: 'IndependentConceptBottleneckModel'
      extra_name: ""
      sigmoidal_embedding: false
      concat_prob: false
      embedding_activation: "leakyrelu"
      bool: false
      extra_dims: 0
      sigmoidal_extra_capacity: false
      sigmoidal_prob: true
      c2y_max_epochs: 200

    # ConceptEmbeddingModel run; sets `sigmoidal_prob: true` (false in
    # `shared_params`) and repeats `training_intervention_prob: 0.25`.
    - architecture: 'ConceptEmbeddingModel'
      extra_name: ""
      shared_prob_gen: true
      sigmoidal_prob: true
      sigmoidal_embedding: false
      training_intervention_prob: 0.25
      concat_prob: false
      embedding_activation: "leakyrelu"

    # IntAwareConceptEmbeddingModel run. `intervention_weight` holds a list of
    # values and is named under `grid_variables`; `extra_name` carries a
    # `{intervention_weight}` placeholder.
    # NOTE(review): presumably one run is launched per listed value, with the
    # placeholder filled in to keep result names distinct — confirm.
    - architecture: 'IntAwareConceptEmbeddingModel'
      extra_name: "_intervention_weight_{intervention_weight}"
      training_intervention_prob: 0.25
      horizon_binary_representation: true
      include_task_trajectory_loss: true
      include_only_last_trajectory_loss: true
      task_loss_weight: 0
      intervention_weight: [5, 1, 0.1, 0]
      intervention_task_loss_weight: 1
      initial_horizon: 2
      use_concept_groups: true
      use_full_mask_distr: false
      propagate_target_gradients: false
      int_model_use_bn: true
      int_model_layers: [128, 128, 64, 64]
      intcem_task_loss_weight: 0
      embedding_activation: "leakyrelu"
      tau: 1
      max_horizon: 6
      horizon_uniform_distr: true
      beta_a: 1
      beta_b: 3
      intervention_task_discount: 1.1
      average_trajectory: true
      # NOTE(review): several horizon_* keys are set although `use_horizon` is
      # false — confirm they are still read in that case.
      use_horizon: false
      initialize_discount: false
      model_pretrain_path: null
      horizon_rate: 1.005
      intervention_discount: 1
      legacy_mode: false
      grid_variables:
          - intervention_weight
      grid_search_mode: exhaustive