---
# Experiment configuration: a flat mapping of hyperparameter names to scalars.
# The code that consumes this file is not visible here, so the notes below
# describe only what the keys and values themselves show; anything inferred
# from a key name is marked as an assumption to be confirmed.
#
# Booleans are written in canonical lowercase (`true` / `false`) so that they
# resolve to booleans under every YAML schema.

# --- Dataset and model selection ---
data_name: CIFAR100_x32
model_depth: 32
model_width: 4
model_style: FRN-Swish
model_name: FlaxResNet

# --- Optimiser settings (`optim_*` keys) ---
# NOTE(review): `bs` / `ne` / `lr` presumably mean batch size, number of
# epochs and learning rate — confirm against the training script.
optim_bs: 128
optim_ne: 50
optim_lr: 0.00025
# NOTE(review): parsed as the integer 0, not the float 0.0 — confirm the
# consumer accepts an int here.
optim_weight_decay: 0

# --- Method-specific settings ---
# The semantics of the keys below are defined by the consuming code and
# cannot be determined from this file alone.
beta: 0.5
beta2: 0.0001
# NOTE(review): parsed as the integer 0, not the float 0.0.
droprate: 0
ema_decay: 0.99995
# Plain string scalar; the leading `v` keeps it from being read as a number.
version: v1.1.8
T: 5
n_feat: 128
tag: AtoABC
fat: 1
feature_name: feature.layer1stride1
shared_head: false
sgd_state: true
crt: 1
cls_from_scratch: false
mixup_alpha: 0.4
forget: 6
linear_nose: true
start_temp: 2
ensemble_prediction: 3
dsc: true
input_scaling: 3
joint_depth: 6
width_multi: 2
centering: false
distill_alpha: 0.5