defaults:
  - _self_
  - wandb: private.yaml
  - override hydra/hydra_logging: disabled
  - override hydra/job_logging: disabled

# disable hydra outputs
hydra:
  output_subdir: null
  run:
    dir: .

name: "radialvicreg-cifar100" # change here for cifar100
method: "radialvicreg"
backbone:
  name: "resnet18" 
method_kwargs:
 
  sim_loss_weight: 25.0
  var_loss_weight: 25.0
  cov_loss_weight: 1.0
  radial_loss_weight: 100
  radial_ent_loss_weight: 100
  projector_type: "mlp3"
  lambda_strategy: "standard"  # "standard" or "self_tune"
  add_projector_classifier: true # add this everywehere we want to log projector metrics as a method kwarg
  w1_radial_loss_weight: 0.0
  w1_target_num_samples: 512
  pre_projector_w1_loss_weight: 0.0

data:
  dataset: cifar100 # change here for cifar100
  train_path: "./datasets"
  val_path: "./datasets" #"datasets/imagenet100/val" - is this really correct? it seemed that the default was just ./datasets
  format: "image_folder"
  num_workers: 4

augmentations:
  - rrc:
      enabled: True
      crop_min_scale: 0.2
      crop_max_scale: 1.0
    color_jitter:
      enabled: True
      brightness: 0.4
      contrast: 0.4
      saturation: 0.2
      hue: 0.1
      prob: 0.8
    grayscale:
      enabled: True
      prob: 0.2
    gaussian_blur: #@KEEP IT AS IS FOR NOW - changeed just for CIFAR100 #IMP IMP IMP
      enabled: False
      prob: 0.0
    solarization:
      enabled: True
      prob: 0.1
    equalization:
      enabled: False
      prob: 0.0
    horizontal_flip:
      enabled: True
      prob: 0.5
    crop_size: 32
    num_crops: 2

optimizer:
  name: "lars"
  batch_size: 256
  lr: 0.3
  classifier_lr: 0.1 # this is also the LR for the MLP accuracy head - 0.1 is the standard it seems
  weight_decay: 1e-4
  kwargs:
    clip_lr: True
    eta: 0.02
    exclude_bias_n_norm: True

scheduler:
  name: "warmup_cosine"
checkpoint:
  enabled: True
  dir: "trained_models"
  frequency: 1
auto_resume:
  enabled: False

# overwrite PL stuff
max_epochs: 400 # 1000
devices: [0]
sync_batchnorm: True
accelerator: "gpu"
strategy: "ddp"
precision: 16-mixed

knn_eval:
  enabled: True # maybe should turn it off? on for better logging - it does indeed fail it seems

radius_hist:
  enabled: true
  max_snapshots: 50 # fire to see the transition - maybe in the future we can decrease it to more like 10 but for now 50 is good