trials: 5
results_dir: results/mnist_add_incomp
dataset: mnist_add
num_workers: 8
batch_size: 2048
num_operands: 12
selected_digits:
  - [0,1,2]
  - [0,1,2]
  - [0,1,2]
  - [0,1,2]
  - [0,1,2,3,4]
  - [0,1,2,3,4]
  - [0,1,2,3,4]
  - [0,1,2,3,4]
  - [0,1,2,3,4,5,6,7,8,9]
  - [0,1,2,3,4,5,6,7,8,9]
  - [0,1,2,3,4,5,6,7,8,9]
  - [0,1,2,3,4,5,6,7,8,9]
threshold_labels: 30
noise_level: 0.0
max_epochs: 300
train_dataset_size: 10000
sampling_percent: 0.625
sampling_groups: True
c2y_layers: [128, 128]
skip_repr_evaluation: True

# Intervention Parameters
intervention_freq: 1
intervention_batch_size: 2048
intervention_policies:
    - "group_random"
    - "group_random_no_prior"
    - "group_coop_no_prior"
    - "behavioural_cloning_no_prior"
    - "group_uncertainty_no_prior"
    - "optimal_greedy_no_prior"
    - "global_val_error_no_prior"
    - "global_val_improvement_no_prior"

# DATASET VARIABLES
root_dir: data/mnist/
test_subsampling: 1
weight_loss: True
use_task_class_weights: True
check_val_every_n_epoch: 2

shared_params:
    top_k_accuracy: null
    save_model: True
    patience: 5
    emb_size: 16
    extra_dims: 0
    concept_loss_weight: 10
    learning_rate: 0.001
    weight_decay: 0.000004
    c_extractor_arch: resnet18
    optimizer: sgd
    bool: False
    early_stopping_monitor: val_loss
    early_stopping_mode: min
    early_stopping_delta: 0.0
    momentum: 0.9
    sigmoidal_prob: False
    training_intervention_prob: 0.25
runs:
    - architecture: 'ConceptBottleneckModel'
      extra_name: "Sigmoid_long"
      sigmoidal_embedding: False
      training_intervention_prob: 0.25
      concept_loss_weight: 5
      max_epochs: 500
      concat_prob: False
      embedding_activation: "leakyrelu"
      bool: False
      extra_dims: 0
      sigmoidal_extra_capacity: False
      sigmoidal_prob: True

    - architecture: 'ConceptBottleneckModel'
      extra_name: "Logit_long"
      sigmoidal_embedding: False
      concat_prob: False
      embedding_activation: "leakyrelu"
      bool: False
      extra_dims: 0
      sigmoidal_extra_capacity: False
      sigmoidal_prob: False
      max_epochs: 500

    - architecture: 'SequentialConceptBottleneckModel'
      extra_name: "_long"
      sigmoidal_embedding: False
      concat_prob: False
      embedding_activation: "leakyrelu"
      bool: False
      extra_dims: 0
      sigmoidal_extra_capacity: False
      sigmoidal_prob: True
      c2y_max_epochs: 200

    - architecture: 'IndependentConceptBottleneckModel'
      extra_name: "_long"
      sigmoidal_embedding: False
      concat_prob: False
      embedding_activation: "leakyrelu"
      bool: False
      extra_dims: 0
      sigmoidal_extra_capacity: False
      sigmoidal_prob: True
      max_epochs: 300

    - architecture: "IntAwareConceptEmbeddingModel"
      extra_name: "Retry_intervention_weight_{intervention_weight}_horizon_rate_{horizon_rate}_intervention_discount_{intervention_discount}_task_discount_{intervention_task_discount}"
      training_intervention_prob: 0.25
      horizon_binary_representation:  True
      include_task_trajectory_loss: True
      include_only_last_trajectory_loss: True
      task_loss_weight: 0
      intervention_weight: [5,1,0.1,0]
      intervention_task_loss_weight: 1
      initial_horizon: 2
      use_concept_groups: True # DIFF False
      use_full_mask_distr: False
      propagate_target_gradients: False
      int_model_use_bn: True
      int_model_layers: [128,128,64,64]
      intcem_task_loss_weight: 0
      embedding_activation: "leakyrelu"
      tau: 1
      max_horizon: 6
      horizon_uniform_distr: True
      beta_a: 1
      beta_b: 3
      intervention_task_discount: [1.5, 1.1]
      average_trajectory: True
      use_horizon: False # DIFF True
      initialize_discount: False
      model_pretrain_path: null
      horizon_rate: 1.005
      intervention_discount: 1
      legacy_mode: False # Diff True
      grid_variables:
          - intervention_task_discount
          - intervention_weight
      grid_search_mode: exhaustive


    - architecture: 'ConceptEmbeddingModel'
      extra_name: ""
      shared_prob_gen: True
      sigmoidal_prob: True
      sigmoidal_embedding: False
      training_intervention_prob: 0.25
      concat_prob: False
      embedding_activation: "leakyrelu"

    - architecture: "IntAwareConceptEmbeddingModel"
      extra_name: "LastOnly_intervention_weight_{intervention_weight}_horizon_rate_{horizon_rate}_intervention_discount_{intervention_discount}_tau_{tau}_max_horizon_{max_horizon}_task_discount_{intervention_task_discount}_uniform_distr_{uniform_distr}_no_horizon"
      horizon_binary_representation:  True
      include_task_trajectory_loss: True
      include_only_last_trajectory_loss: True
      average_trajectory: False #True
      task_loss_weight: 0
      use_concept_groups: True
      embedding_activation: "leakyrelu"
      tau: 1
      max_horizon: 13
      uniform_distr: True
      beta_a: 1
      beta_b: 3
      use_horizon: False
      model_pretrain_path: null
      pretrain_intcem: False
      intervention_weight: [5,1,0.1]
      initial_horizon: 2
      include_probs: False
      use_full_mask_distr: True
      int_model_use_bn: True
      int_model_layers: [128,128,64,64]
      intervention_discount: 1.05
      horizon_rate: 1
      intcem_task_loss_weight: 0
      intervention_task_discount: 1.05
      intervention_task_loss_weight: 1
      initialize_discount: True
      training_intervention_prob: 0.25
      propagate_target_gradients: True
      num_rollouts: [1]
      grid_variables:
          - intervention_weight
          - num_rollouts
      grid_search_mode: exhaustive

    - architecture: 'ConceptBottleneckModel'
      extra_name: "Sigmoid"
      sigmoidal_embedding: False
      training_intervention_prob: 0.25
      concat_prob: False
      embedding_activation: "leakyrelu"
      bool: False
      extra_dims: 0
      sigmoidal_extra_capacity: False
      sigmoidal_prob: True

    # - architecture: 'ConceptBottleneckModel'
    #   extra_name: "Sigmoid_concept_loss_weight_{concept_loss_weight}"
    #   sigmoidal_embedding: False
    #   training_intervention_prob: 0.25
    #   concat_prob: False
    #   embedding_activation: "leakyrelu"
    #   bool: False
    #   extra_dims: 0
    #   concept_loss_weight: [0.1, 1, 5]
    #   sigmoidal_extra_capacity: False
    #   sigmoidal_prob: True
    #   grid_variables:
    #       - concept_loss_weight
    #   grid_search_mode: exhaustive

    - architecture: 'ConceptBottleneckModel'
      extra_name: "Logit"
      sigmoidal_embedding: False
      concat_prob: False
      embedding_activation: "leakyrelu"
      bool: False
      extra_dims: 0
      sigmoidal_extra_capacity: False
      sigmoidal_prob: False


    - architecture: 'SequentialConceptBottleneckModel'
      extra_name: ""
      sigmoidal_embedding: False
      concat_prob: False
      embedding_activation: "leakyrelu"
      bool: False
      extra_dims: 0
      sigmoidal_extra_capacity: False
      sigmoidal_prob: True

    - architecture: 'IndependentConceptBottleneckModel'
      extra_name: ""
      sigmoidal_embedding: False
      concat_prob: False
      embedding_activation: "leakyrelu"
      bool: False
      extra_dims: 0
      sigmoidal_extra_capacity: False
      sigmoidal_prob: True
