defaults:
  - _self_
  - augmentations: symmetric.yaml
  - wandb: private.yaml
  - override hydra/hydra_logging: disabled
  - override hydra/job_logging: disabled

# disable hydra outputs
hydra:
  output_subdir: null
  run:
    dir: .

name: "radialvicreg-cpt-from-vicreg-imagenet"
method: "radialvicreg"
backbone:
  name: "resnet50"

# CPT configuration: Path to the foreign checkpoint to resume from.
cpt_checkpoint_path: "backbones/vicreg_resnet50_fullckpt.pth"

# Training length: Assuming vicreg_resnet50_fullckpt.pth was trained for 1000 epochs,
# setting max_epochs to 1010 will train for exactly 10 more epochs.
max_epochs: 1010

method_kwargs:
  proj_hidden_dim: 8192
  proj_output_dim: 8192
  sim_loss_weight: 25.0
  var_loss_weight: 25.0
  cov_loss_weight: 1.0
  radial_loss_weight: 0.0
  projector_type: "mlp"
  add_projector_classifier: true
data:
  dataset: imagenet
  train_path: "/imagenet/train"
  val_path: "/imagenet/val"
  format: "image_folder"
  num_workers: 16
optimizer:
  name: "lars"
  batch_size: 128 # paper uses 256 changed to 128 for 2 GPUs
  lr: 0.003
  classifier_lr: 0.1
  weight_decay: 1e-4
  kwargs:
    clip_lr: True
    eta: 0.02
    exclude_bias_n_norm: True
scheduler:
  name: "warmup_cosine"
  warmup_epochs: 1
checkpoint:
  enabled: True
  dir: "trained_models"
  frequency: 1
auto_resume:
  enabled: False

# overwrite PL stuff
devices: [0, 1]
sync_batchnorm: True
accelerator: "gpu"
strategy: "ddp"
precision: 16-mixed
knn_eval:
  enabled: False # add false to avoid OOM erros since at validation it would have to store all these dense embeddings in the ram 
