# Runtime and data-loading switches. This file does not document its keys;
# the notes below are inferred from the key names only — confirm against the
# code that loads this config.
device: 'cuda'
# Booleans use the canonical lowercase spelling so that YAML 1.1 and 1.2
# loaders (and linters) all agree on the type.
amp: true  # presumably automatic mixed precision — TODO confirm
pin_memory: true
non_blocking: true
prefetch: false
num_workers: 4

# Dataset selection. The path is relative; what it is resolved against
# (working directory or this file's location) depends on the loader —
# TODO confirm.
dataset_path: '../data'
dataset: 'tiny'

# Unset in this config. A bare `key:` already loads as null, so writing
# `null` keeps the loaded value identical while making the intent explicit.
checkpoint_load: null
checkpoint_save: null
log: null

# Training schedule.
epochs: 200
batch_size: 128
lr: 0.01
# Quoted like the other string values in this file; still loads as a string.
lr_scheduler: 'ReduceLROnPlateau'

# Optimizer settings.
client_optimizer: 'sgd'
sgd_momentum: 0.9
# Keep the decimal point and the signed exponent: YAML 1.1 loaders such as
# PyYAML read a bare `5e-4` as a string rather than a float.
wd: 5.0e-4
# NOTE(review): 0 presumably disables periodic checkpoint saving — confirm.
frequency_save: 0

# Second group of optimizer-style settings. NOTE(review): `te_` presumably
# refers to a teacher-model stage, and `momentum` / `weight_decay` are
# separate keys from `sgd_momentum` / `wd` in this file — confirm which
# stage reads which.
te_epochs: 10
momentum: 0.9
# Keep the `1.0e-4` spelling (decimal point plus signed exponent) so that
# YAML 1.1 loaders such as PyYAML parse it as a float, not a string.
weight_decay: 1.0e-4

# Coefficients and exponent consumed by the training code; presumably
# loss-term weights and a norm power — TODO confirm against the consumer.
beta1: 500
beta2: 1000
beta3: 1000
p: 2.0

# Unset in this config; explicit `null` loads the same as a bare `key:`.
teacher_model_loc: null



