# Hydra defaults list: the config groups composed into this experiment.
# `_self_` is listed first, so under Hydra's composition order the entries
# below are merged after the values defined in this file.
defaults:
  - _self_
  - augmentations: symmetric.yaml
  - wandb: private.yaml
  # Select the "disabled" option for Hydra's own logging config groups.
  - override hydra/hydra_logging: disabled
  - override hydra/job_logging: disabled

# Disable Hydra's output artifacts: no config-snapshot subdirectory
# (output_subdir: null) and the run directory is the current directory.
hydra:
  output_subdir: null
  run:
    dir: .

# Experiment identity: run name, method identifier, and backbone network.
name: "vicreg-e2mc-imagenet-cpt"
method: "vicreg_e2mc"
backbone:
  name: "resnet50"
# CPT configuration: path to the foreign (externally trained) checkpoint that
# this run resumes from.
# NOTE(review): "CPT" presumably means continued pre-training — confirm.
cpt_checkpoint_path: "backbones/vicreg_resnet50_fullckpt.pth" # always verify this path

# Training length: max_epochs is the total epoch count, not the number of
# additional epochs. Assuming vicreg_resnet50_fullckpt.pth was trained for
# 1000 epochs, max_epochs: 1010 trains for exactly 10 more epochs.
# NOTE(review): this relies on the epoch counter being restored from the
# checkpoint — confirm against the loading code.
max_epochs: 1010

# Hyperparameters for the "vicreg_e2mc" method.
# NOTE(review): the groupings below are inferred from the key names only —
# confirm against the method implementation.
method_kwargs:
  # Projector dimensions.
  proj_hidden_dim: 8192
  proj_output_dim: 8192
  # Loss-term weights.
  sim_loss_weight: 25.0
  var_loss_weight: 25.0
  cov_loss_weight: 1.0
  ent_loss_weight: 1000.0
  hypercov_loss_weight: 100.0
  # Written with an explicit mantissa dot: a bare "1e-7" is resolved as a
  # string (not a float) by YAML 1.1 loaders such as plain PyYAML.
  epsilon: 1.0e-7
  add_projector_classifier: true

# Dataset settings: ImageNet train/val directories in "image_folder" format.
data:
  dataset: imagenet
  train_path: "/imagenet/train"
  val_path: "/imagenet/val"
  format: "image_folder"
  num_workers: 8
# Optimizer settings (LARS).
optimizer:
  name: "lars"
  # NOTE(review): this key previously carried the comment "temporarily
  # changed to 128" while the value is 256 — confirm the intended batch size.
  batch_size: 256
  lr: 0.003  # very small lr - with CPT
  classifier_lr: 0.1
  # Explicit mantissa dot so every YAML loader resolves this as a float
  # (a bare "1e-6" is a string under YAML 1.1 loaders such as plain PyYAML).
  weight_decay: 1.0e-6
  # Extra keyword arguments for the optimizer.
  kwargs:
    clip_lr: true
    eta: 0.02
    exclude_bias_n_norm: true
# Learning-rate schedule: "warmup_cosine" with a 1-epoch warmup.
scheduler:
  name: "warmup_cosine"
  warmup_epochs: 1
# Checkpoint saving: enabled, written under "trained_models".
checkpoint:
  enabled: true
  dir: "trained_models"
  # NOTE(review): unit is not shown here (presumably epochs) — confirm.
  frequency: 1
# Automatic resume is switched off for this run.
auto_resume:
  enabled: false

# Override trainer-level settings.
# NOTE(review): the original note calls these "PL stuff", presumably
# PyTorch Lightning — confirm.
devices: [0, 1]
sync_batchnorm: true
accelerator: "gpu"
strategy: "auto"
precision: "16-mixed"
knn_eval:
  # Kept off to avoid out-of-memory (OOM) errors.
  enabled: false
