experiment_name: torch_vct
seed: 202208

ngpu: 1
num_workers_per_task: 1

user: ${oc.env:USER} # oc=omegaconf

defaults:
  - _self_
  - analysis_transform: movie 
  - synthesis_transform: movie 
  - datamodule: vimeo
  - optim: adamw
  - scheduler: linearrampcosine 
  - test_datamodule: uvg

model:
  _target_: model_pipeline.MoVieipeline
  analysis_transform: ${analysis_transform}
  synthesis_transform: ${synthesis_transform}
  compression_channels: 192


training_loop:
  learning_rate: 2e-4
  lr_annealing_frequency: ${checkpoint.callback.every_n_train_steps}
  distortion_lambda: 0.0035
  train_batch_size: 4
  val_batch_size: 4
  pseudo_epochs: ${eval:${trainer.max_steps}//${training_loop.lr_annealing_frequency}} 

# logging configs
checkpoint:
  overwrite: False # overwrite logs already in training dir
  resume_training: True # resume training from previous logs
  callback: # passed to PyTorch Lightning's ModelCheckpoint callback
    dirpath: checkpoints
    save_top_k: 2
    monitor: val_combined_loss_weighted
    mode: min
    save_last: True
    every_n_train_steps: 2000 # also equals annealing freq and val evaluation


# These args are passed to the PyTorch Lightning Trainer - add extra customization here
trainer: 
  # Steps, dev runs etc 
  fast_dev_run: False # Default=False; if int runs n steps of train/val ~ unit test
  max_steps: 1_000_000      # test step in paper
  log_every_n_steps: 100   # default=50
  # ---
  # Validation: validate every time checkpoint is stored
  val_check_interval: ${checkpoint.callback.every_n_train_steps} # default is 1.0
  check_val_every_n_epoch: # None = disable epoch validation, validate every <val_check_interval> steps 
  limit_val_batches: 10    # Use <limit_val_batches> instead of the whole validation set
  # ---
  # Devices
  devices: ${ngpu}  
  accelerator: gpu 
  gradient_clip_val: 1.0
  gradient_clip_algorithm: norm

tester:
  accelerator: gpu 
  devices: 1

logger: 
  entity: 
  project: torch_vct
  group: dev

hydra:
  run:
    dir: output/${now:%Y-%m-%d}/${now:%H-%M-%S}
  sweep:
    dir: multirun/${now:%Y-%m-%d}/${now:%H-%M-%S}
  job:
    config:
      override_dirname:
        exclude_keys:
          - mode
          - experiment_name
          - hydra.launcher.timeout_min
