defaults:
  - _self_
  - augmentations: symmetric.yaml
  - wandb: private.yaml
  - override hydra/hydra_logging: disabled
  - override hydra/job_logging: disabled

# disable hydra outputs
hydra:
  output_subdir: null
  run:
    dir: .

name: "nat-cifar100" # change here for cifar100
method: "nat"
backbone:
  name: "resnet18"
method_kwargs:
  proj_hidden_dim: 2048
  proj_output_dim: 256
  update_freq: 3                # frequency to update assignments (in epochs)
  # Auxiliary loss settings (for logging by default)
  variance_lambda: 0.1          # Weight if optimize_variance is true
  optimize_variance: false      # Set to true to add variance loss to total_loss
  covariance_lambda: 0.1        # Weight if optimize_covariance is true
  optimize_covariance: false    # Set to true to add covariance loss to total_loss
  radial_lambda: 0.1            # Weight if optimize_radial is true
  optimize_radial: false        # Set to true to add radial loss to total_loss
  lambda_strategy: "standard"   # "standard" or "self_tune"
  add_projector_classifier: true # Add projector classifier for evaluation
data:
  dataset: cifar100 # change here for cifar100
  dataset_size: 50000 # Added for fallback in NAT setup - the dataset size for CIFAR100 is 50000
  train_path: "./datasets"
  val_path: "./datasets"
  format: "image_folder"
  num_workers: 4
optimizer:
  name: "lars"
  batch_size: 256 # the same as YAML so the uniformity loss values should be comparable
  lr: 0.5
  classifier_lr: 0.1
  weight_decay: 1e-4
  kwargs:
    clip_lr: True
    eta: 0.02
    exclude_bias_n_norm: True
scheduler:
  name: "warmup_cosine"
checkpoint:
  enabled: True
  dir: "trained_models"
  frequency: 1
auto_resume:
  enabled: True

# overwrite PL stuff
max_epochs: 300 # 1000
devices: [0]
sync_batchnorm: True
accelerator: "gpu"
strategy: "ddp"
precision: 16-mixed
knn_eval:
  enabled: True