trials: 5
results_dir: results/intcbm_results
dataset: cub
num_workers: 8
batch_size: 128

# DATASET VARIABLES
root_dir: data/CUB200/
sampling_percent: 0.25
sampling_groups: True
test_subsampling: 0.5
skip_repr_evaluation: True


# Intervention Parameters
intervention_freq: 1
intervention_batch_size: 128
intervention_policies:
    - "group_random"
    - "group_random_no_prior"
    - "group_coop_no_prior"

max_epochs: 300
shared_params:
    top_k_accuracy: null
    save_model: True
    patience: 15
    emb_size: 16
    extra_dims: 0
    concept_loss_weight: 5
    learning_rate: 0.01
    weight_decay: 0.000004
    weight_loss: True
    c_extractor_arch: resnet34
    optimizer: sgd
    bool: False
    early_stopping_monitor: val_loss
    early_stopping_mode: min
    early_stopping_delta: 0.0
    momentum: 0.9
    sigmoidal_prob: False
    training_intervention_prob: 0.25

runs:
    - architecture: "IntAwareConceptBottleneckModel"
      extra_name: "Sigmoid_intervention_weight_{intervention_weight}"
      training_intervention_prob: 0.25
      horizon_binary_representation:  True
      include_task_trajectory_loss: True
      include_only_last_trajectory_loss: True
      task_loss_weight: 0
      intervention_weight: [1]
      intervention_task_loss_weight: 1
      initial_horizon: 2
      use_concept_groups: True # DIFF False
      use_full_mask_distr: False
      propagate_target_gradients: False
      int_model_use_bn: True
      int_model_layers: [128,128,64,64]
      intcem_task_loss_weight: 0
      embedding_activation: "leakyrelu"
      tau: 1
      max_horizon: 5
      horizon_uniform_distr: True
      beta_a: 1
      beta_b: 3
      intervention_task_discount: 1.1
      average_trajectory: True
      use_horizon: False
      initialize_discount: False
      model_pretrain_path: null
      horizon_rate: 1.005
      intervention_discount: 1
      legacy_mode: False
      grid_variables:
          - intervention_weight
      grid_search_mode: exhaustive
      sigmoidal_prob: True
      concept_loss_weight: 1

    - architecture: "ConceptBottleneckModel"
      extra_name: "Sigmoid_concept_loss_weight_1"
      sigmoidal_embedding: False
      concat_prob: False
      embedding_activation: "leakyrelu"
      bool: False
      extra_dims: 0
      sigmoidal_extra_capacity: False
      sigmoidal_prob: True
      concept_loss_weight: 1

    - architecture: "ConceptBottleneckModel"
      extra_name: "Logit_concept_loss_weight_1"
      sigmoidal_embedding: False
      concat_prob: False
      embedding_activation: "leakyrelu"
      bool: False
      extra_dims: 0
      sigmoidal_extra_capacity: False
      sigmoidal_prob: False
      concept_loss_weight: 1

    - architecture: "IntAwareConceptBottleneckModel"
      extra_name: "Logit_intervention_weight_{intervention_weight}"
      training_intervention_prob: 0.25
      horizon_binary_representation:  True
      include_task_trajectory_loss: True
      include_only_last_trajectory_loss: True
      task_loss_weight: 0
      intervention_weight: [1]
      intervention_task_loss_weight: 1
      initial_horizon: 2
      use_concept_groups: True
      use_full_mask_distr: False
      propagate_target_gradients: False
      int_model_use_bn: True
      int_model_layers: [128,128,64,64]
      intcem_task_loss_weight: 0
      embedding_activation: "leakyrelu"
      tau: 1
      max_horizon: 5
      horizon_uniform_distr: True
      beta_a: 1
      beta_b: 3
      intervention_task_discount: 1.1
      average_trajectory: True
      use_horizon: False
      initialize_discount: False
      model_pretrain_path: null
      horizon_rate: 1.005
      intervention_discount: 1
      legacy_mode: False
      grid_variables:
          - intervention_weight
      grid_search_mode: exhaustive
      sigmoidal_prob: False

    - architecture: 'ConceptEmbeddingModel'
      extra_name: ""
      shared_prob_gen: True
      sigmoidal_prob: True
      sigmoidal_embedding: False
      training_intervention_prob: 0.25
      concat_prob: False
      embedding_activation: "leakyrelu"

    - architecture: "IntAwareConceptEmbeddingModel"
      extra_name: "_intervention_weight_{intervention_weight}"
      training_intervention_prob: 0.25
      horizon_binary_representation:  True
      include_task_trajectory_loss: True
      include_only_last_trajectory_loss: True
      task_loss_weight: 0
      intervention_weight: [1]
      intervention_task_loss_weight: 1
      initial_horizon: 2
      use_concept_groups: True
      use_full_mask_distr: False
      propagate_target_gradients: False
      int_model_use_bn: True
      int_model_layers: [128,128,64,64]
      intcem_task_loss_weight: 0
      embedding_activation: "leakyrelu"
      tau: 1
      max_horizon: 5
      horizon_uniform_distr: True
      beta_a: 1
      beta_b: 3
      intervention_task_discount: 1.1
      average_trajectory: True
      use_horizon: False
      initialize_discount: False
      model_pretrain_path: null
      horizon_rate: 1.005
      intervention_discount: 1
      legacy_mode: False
      grid_variables:
          - intervention_weight
      grid_search_mode: exhaustive

