[INFO]
num_nodes = 2
gpus_per_node = 4
cpus_per_gpu = 12
prefetch_factor = 2
precision = 16-mixed
fix_random_seed = no
strategy = ddp
if_profile = no

[DATA]
dataset = IMAGENET1K
n_views = 4
n_trans = 2
augmentation_package = albumentations
augmentations = RandomResizedCrop,GaussianBlur,RandomGrayscale,ColorJitter,RandomHorizontalFlip,RandomSolarize
crop_size = 224,224
crop_min_scale = 0.08,0.08
crop_max_scale = 1.0,1.0
hflip_prob = 0.5,0.5
blur_kernel_size = 23,23
blur_prob = 1.0,0.1
grayscale_prob = 0.2,0.2
jitter_brightness = 0.4,0.4
jitter_contrast = 0.4,0.4
jitter_saturation = 0.2,0.2
jitter_hue = 0.1,0.1
jitter_prob = 0.8,0.8
solarize_prob = 0.0,0.2
imagenet_train_dir = /imagenet/train # location for the imagenet-1K dataset
imagenet_val_dir = /imagenet/val  # location for the imagenet-1K dataset

[SSL]
backbone = resnet50
use_projection_head = yes
proj_dim = 8192,8192
proj_out_dim = 512
optimizer = LARS
lr = 1.1
lr_scale = linear
lr_scheduler = cosine-warmup
momentum = 0.9
weight_decay = 1e-6
exclude_bn_bias_from_weight_decay = yes
lars_eta = 0.001
loss_function = LogRepulsiveEllipsoidPackingLossUnitNorm
lw0 = 0.0
lw1 = 1.0
lw2 = 0.0
rs = 8.5
pot_pow = 2.0
warmup_epochs = 10
n_epochs = 100
batch_size = 512
save_every_n_epochs = 10
skip_validation = yes

[LC]
output_dim = 1000
optimizer = SGD
use_batch_norm = no
lr_sweep = 0.8,1.2,1.6
lr_scale = linear
lr_scheduler = cosine
weight_decay = 1e-6
momentum = 0.9
loss_function = CrossEntropyLoss
n_epochs = 100
batch_size = 2048
save_every_n_epochs = 25

[SemiSL]
loss_function = CrossEntropyLoss
apply_simple_augmentations = yes
standardize_to_imagenet = yes
optimizer = SGD
lr_sweep = 0.1,0.2,0.4,0.6,0.8
lr_scale = linear
backbone_lr_slowdown = 0.05 # lr for the backbone = lr*backbone_lr_slowdown
lr_scheduler = cosine
momentum = 0.9
weight_decay = 0.0
n_epochs = 20
batch_size = 256
save_every_n_epochs = 10
skip_validation = yes
apply_simple_augmentations = yes # crop center + horizontal flip
standardize_to_imagenet = yes
skip_validation = yes
