# Experiment identifier for this configuration.
# NOTE(review): presumably used to label run outputs; confirm against the
# code that consumes this config.
name: moco_v3-cifar-finetune-contrastive-eval
# Dataset and data-loading settings.
dataset:
  name: cifar10
  # NOTE(review): 224 is larger than CIFAR-10's native 32x32 images, so inputs
  # are presumably resized before reaching the model; confirm in the pipeline.
  image_size: 224
  # -1 selects the "maximize" setting; 1 means no augmentation.
  aug_num: -1
  max_dataset_size: 50000
  # NOTE(review): ImageNet-related values; how they interact with the cifar10
  # dataset is not visible in this file. Confirm against the consumer.
  num_imagenet_classes: 1000
  imagenet_size: 50000
  # NOTE(review): presumably the number of data-loader worker processes.
  num_workers: 8

# Model settings.
model:
  name: moco_v3:vit_base
  # NOTE(review): presumably selects the input normalization mean/std preset;
  # confirm against the consumer.
  mean_std_name: imagenet
  moco_dim: 512  # feature dimension

# The training section is explicitly null in this configuration.
# NOTE(review): presumably this skips the training stage; confirm against the
# code that consumes this config.
train: null
  
# Evaluation settings.
# Original note: linear evaluation; setting this section to False will turn
# off automatic evaluation after training.
eval:
  optimizer:
    name: sgd
    weight_decay: 0.0005
    momentum: 0.9
  # NOTE(review): warmup_epochs is 0, so learning-rate warmup is presumably
  # disabled and warmup_lr unused; confirm against the scheduler.
  warmup_lr: 0
  warmup_epochs: 0
  base_lr: 0.06
  final_lr: 0
  batch_size: 256
  num_epochs: 200
  # NOTE(review): the meaning of theta is not evident from this file; document
  # it here once confirmed.
  theta: 0.1

# Logging backends; both are turned off in this configuration.
# Booleans use the canonical lowercase form so every YAML parser and linter
# reads them the same way.
logger:
  tensorboard: false
  matplotlib: false

# Besides the random seed, two things can still introduce stochastic behavior:
# the dataloader's worker_init_fn and torch.nn.functional.interpolate.
# Keep this in mind if you need 100% deterministic results.





