# Hydra defaults list: pulls in the defaults from the other YAML files.
# `_self_` is listed first, so the entries after it are composed on top of
# the values defined in this file.
defaults:
  - _self_
  - augmentations: asymmetric.yaml
  - wandb: private.yaml
  - override hydra/hydra_logging: disabled
  - override hydra/job_logging: disabled

# Disable Hydra's own output handling for this run.
hydra:
  # null: do not write Hydra's config-snapshot subdirectory.
  output_subdir: null
  run:
    # Use the current directory as the run directory instead of a generated one.
    dir: .

# Experiment name, method identifier and backbone name.
# The accepted values are defined by the consuming training code (not shown
# in this file).
name: "radialmocov3-cpt-imagenet"
method: "radialmocov3"
backbone:
  name: "resnet50"


# CPT settings
# Path to the foreign checkpoint that training resumes from.
cpt_checkpoint_path: "backbones/moco_resnet50_1000ep.pth.tar"

# Training length. max_epochs counts the epochs already in the checkpoint, so
# the number of additional epochs is max_epochs minus the checkpoint's epochs.
# Assuming moco_resnet50_1000ep.pth.tar was trained for 1000 epochs,
# setting max_epochs to 1010 trains for exactly 10 more epochs.
max_epochs: 1010 # 1000 + 10

# Momentum (tau) settings.
# NOTE(review): presumably base_tau is the starting and final_tau the ending
# coefficient of the momentum-encoder update schedule — confirm against the
# method implementation.
momentum:
  base_tau: 0.99
  final_tau: 1.0


# Hyperparameters specific to the selected method.
# NOTE(review): judging by the key names these are the projector and predictor
# layer sizes, the loss temperature, and the weight of the radial loss term —
# confirm against the method implementation.
method_kwargs:
  proj_hidden_dim: 4096
  proj_output_dim: 256
  pred_hidden_dim: 4096
  temperature: 0.2
  radial_loss_weight: 0.01


# Dataset selection and locations.
data:
  dataset: imagenet
  # Absolute paths; adjust to where the dataset is mounted on the machine.
  train_path: "/imagenet/train"
  val_path: "/imagenet/val"
  format: "image_folder"
  # presumably the number of data-loading worker processes — confirm
  num_workers: 16

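# Inline augmentation pipeline, commented out and therefore inactive.
# The active pipeline is the one selected by the `augmentations` entry in the
# `defaults` list at the top of this file.
# augmentations: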
#   - # view 1
#     rrc:
#       enabled: True
#       crop_min_scale: 0.2
#       crop_max_scale: 1.0
#     color_jitter:
#       enabled: True
#       brightness: 0.4
#       contrast: 0.4
#       saturation: 0.2
#       hue: 0.1
#       prob: 0.8
#     grayscale:
#       enabled: True
#       prob: 0.2
#     gaussian_blur:
#       enabled: True
#       prob: 1.0
#     solarization:
#       enabled: False
#     equalization:
#       enabled: False
#     horizontal_flip:
#       enabled: True
#       prob: 0.5
#     crop_size: 224
#     num_crops: 1
#   - # view 2
#     rrc:
#       enabled: True
#       crop_min_scale: 0.2
#       crop_max_scale: 1.0
#     color_jitter:
#       enabled: True
#       brightness: 0.4
#       contrast: 0.4
#       saturation: 0.2
#       hue: 0.1
#       prob: 0.8
#     grayscale:
#       enabled: True
#       prob: 0.2
#     gaussian_blur:
#       enabled: True
#       prob: 0.1
#     solarization:
#       enabled: True
#       prob: 0.2
#     equalization:
#       enabled: False
#     horizontal_flip:
#       enabled: True
#       prob: 0.5
#     crop_size: 224
#     num_crops: 1


# For CPT, keep the optimizer settings (learning rate etc.) smaller than for
# training from scratch.
optimizer:
  name: "lars"
  batch_size: 256
  lr: 0.003
  classifier_lr: 0.1
  # Written with a decimal point so that YAML 1.1 loaders also read it as a
  # float; a bare `1e-6` is resolved as a string by plain PyYAML.
  weight_decay: 1.0e-6
  # Extra keyword arguments for the optimizer named above.
  kwargs:
    clip_lr: true
    eta: 0.02
    exclude_bias_n_norm: true
# Learning-rate scheduler selection.
scheduler:
  name: "warmup_cosine"
  # presumably the length of the warmup phase, in epochs — confirm
  warmup_epochs: 1
# Checkpoint saving: enabled, written under `dir`.
checkpoint:
  enabled: true
  dir: "trained_models"
  # presumably "save every N epochs" — confirm against the checkpointing code
  frequency: 1
# Automatic resuming is switched off for this run.
auto_resume:
  enabled: false

# Overrides for the PL (presumably PyTorch Lightning) trainer settings.
devices: [0, 1]
sync_batchnorm: true
accelerator: "gpu"
strategy: "auto"
# Quoted so the value is unambiguously a string despite starting with digits.
precision: "16-mixed"

# k-NN evaluation is turned off for this run.
knn_eval:
  enabled: false  # disabled to avoid OOM
