experiment_name: "CLTSPRETraining"
experiment: "metrics" # other values are gan and diffusion

defaults:
  - override hydra/launcher: joblib
hydra:
  launcher:
    n_jobs: 2
   
work_dir: ${hydra:runtime.cwd}
base_path: ""
save_path: "${experiment_name}/"
mlflow_folder: "${base_path}/mlflow"


seed: 42 
device: "cuda"  
num_workers: 8

dataset_name: "air_quality"
dataloader_file: general_pl_dataloader
dataloader_model: TimeweaverDataLoader
cltsp_name: "cltsp_v3"
model_file: cltsp
model_name: CLTSPTrainer 
  
save_key: val_loss
should_compile_torch: True  
store_intermediate_checkpoints: False

######################### GENERAL DATASET CONFIG ########################################
dataset: 
  train_test_split: 0.8
  batch_size: 256
  num_workers: 8

######################## SPECIFIC DATASET CONFIG ########################################

waveforms_dataset:
  num_channels: 1
  time_series_length: 96
  required_time_series_length: 64
  log_dir: ""
  num_discrete_labels: 4
  num_discrete_conditions: 1
  num_continuous_labels: 3
  discrete_condition_embedding_dim: 128
  latent_dim: 48

traffic_dataset:
  num_channels: 1 
  time_series_length: 96
  required_time_series_length: 64
  log_dir: ""
  num_discrete_labels: 135
  num_discrete_conditions: 7
  num_continuous_labels: 4
  discrete_condition_embedding_dim: 128
  latent_dim: 48 

air_quality_dataset:
  num_channels: 6
  time_series_length: 96
  required_time_series_length: 64
  log_dir: ""
  num_discrete_labels: 101 
  num_discrete_conditions: 6
  num_continuous_labels: 5
  discrete_condition_embedding_dim: 128
  latent_dim: 128

stocks_dataset:
  num_channels: 6 
  time_series_length: 96
  required_time_series_length: 64
  log_dir: ""
  num_discrete_labels: 0 
  num_discrete_conditions: 0
  num_continuous_labels: 0 
  discrete_condition_embedding_dim: 128
  latent_dim: 128
  
########################### CLTSP CONFIGS ########################################
cltsp_v3_config:  
    d_model: 128
    d_keys: 8
    d_values: 8
    n_heads: 8
    num_encoder_layers: 8
    num_compression_layers: 1
    d_ff: 2048
    dropout: 0.05
    activation: "gelu"
    num_positive_samples: 2
    discrete_condition_embedding_dim: 128

########################### TRAINING CONFIG ########################################
 
training:
    max_epochs: 5000
    learning_rate: 1e-4
    save_after_every_iters: 100
    auto_lr_find: True
    check_val_every_n_epoch: 10
    save_after_every_n_epochs: 100
    log_every_n_steps: 1
    num_devices: 1
    # strategy: "ddp_find_unused_parameters_true"
    strategy: "auto"
    temperature: 1.0
    use_clip_loss: true
    use_condition_scl_loss: false
    use_timeseries_scl_loss: false

supervised_contrastive_learning:
    temperature: 0.07 
    base_temperature: 0.07
    contrast_mode: "all"
    


model_str: "${cltsp_v3_config.d_model}_${cltsp_v3_config.num_encoder_layers}_${cltsp_v3_config.num_compression_layers}"
run_name: "${model_str}_${dataset_name}_metrics_use_clip_loss_${training.use_clip_loss}_use_condition_scl_loss_${training.use_condition_scl_loss}_use_timeseries_scl_loss_${training.use_timeseries_scl_loss}"