# @package _global_
model:
  name: Causal_CPC

  # Encoder settings. Hyperparameters missing here are to be filled in on the
  # command line, by tuning (tune_hparams: true), or selected with
  # +backbone/crn_hparams=...
  # NOTE(review): the "crn_hparams" group name looks carried over from another
  # model's config -- confirm it is the right group for Causal_CPC.
  encoder:
    _target_: src.models.causal_cpc.Causal_CPCEncoder
    # Disabled (rnn_hidden_units in the original terminology):
    # seq_hidden_units: 15
    br_size: 18
    fc_hidden_units: 18
    genc_hidden: 36
    context_latent_dim: 18
    downsampling_factor: 1
    subsample_win_ratio: 0.05
    dropout_rate: 0.1  # Dropout of LSTM hidden layers + output layers
    num_layer: 1

    # Causal-convolution options; switched off here via use_causalconv.
    use_causalconv: false
    input_channels: 1
    hidden_channels: 16
    kernel_size: 4
    dilation: 1

    batch_size: 64
    optimizer:
      lr_scheduler: false

      non_treatment_head:
        optimizer_cls: adamw
        # NOTE(review): the previous comment read "instead of 0.005", which is
        # the value already set here -- confirm the intended learning rate.
        learning_rate: 0.005
        weight_decay: 0.0

      treatment_head:
        optimizer_cls: sgd
        learning_rate: 0.05  # instead of 0.005
        momentum: 0.9
        weight_decay: 0.0

    use_attention: false

    # Hparam tuning. The grid and per-trial resources are explicitly null
    # (unset) in this file.
    tune_hparams: false
    tune_range: 50
    hparams_grid: null
    resources_per_trial: null

  train_decoder: true

  # Decoder settings. Hyperparameters missing here are to be filled in on the
  # command line, by tuning (tune_hparams: true), or selected with
  # +backbone/crn_hparams=...
  # NOTE(review): same "crn_hparams" naming caveat as for the encoder -- confirm.
  decoder:
    _target_: src.models.causal_cpc.Causal_CPCDecoder
    seq_hidden_units: 18  # rnn_hidden_units in the original terminology
    br_size: 18
    fc_hidden_units: 18
    dropout_rate: 0.1  # Dropout of LSTM hidden layers + output layers
    num_layer: 1
    batch_size: 1024
    y_dist_type: "continuous"
    teacher_forcing: false
    treat_hidden_dim: 12
    optimizer:
      lr_scheduler: false

      non_treatment_head:
        optimizer_cls: adamw
        learning_rate: 0.01  # instead of 0.005
        weight_decay: 0.0

      treatment_head:
        optimizer_cls: sgd
        learning_rate: 0.05  # instead of 0.005
        momentum: 0.9
        weight_decay: 0.0

    # Hparam tuning. The grid and per-trial resources are explicitly null
    # (unset) in this file.
    tune_hparams: false
    tune_range: 30
    hparams_grid: null
    resources_per_trial: null

exp:
  weights_ema: false
  balancing: mutual_info
  # alpha_* coefficients -- presumably weights of the reconstruction, InfoNCE
  # and MSE loss terms; TODO confirm against the training code.
  alpha_recons: 0.1
  alpha_infonce: 0.5
  alpha_mse: 10
  label_smoothing: 0
  use_spectral_norm: true

  # Early-stopping settings for the encoder.
  encoder:
    early_stopping:
      monitor: 'val/loss'
      min_delta: 0.0001
      patience: 15
      verbose: false
      mode: 'min'

  # Early-stopping settings for the decoder; identical to the encoder's
  # except for the shorter patience (10 vs 15).
  decoder:
    early_stopping:
      monitor: 'val/loss'
      min_delta: 0.0001
      patience: 10
      verbose: false
      mode: 'min'




