---
# Flat key/value configuration for a single training run.
#
# Keys are grouped into sections purely as a reading aid. Every key and value
# is unchanged, and key order carries no meaning in a YAML mapping.
# NOTE(review): section titles are inferred from key names only; the consuming
# training script is the authority on what each key actually does.

# --- Model ------------------------------------------------------------------
model: stmixerv3
pretrained: false
num_classes: 100
dim: 384
layer: 4
num_heads: 12
mlp_ratio: 4
patch_size: 4
time_step: 4
gp: null
torchscript: false
channels_last: false

# --- Checkpoints and resume -------------------------------------------------
initial_checkpoint: ''
resume: ''
no_resume_opt: false
start_epoch: null
checkpoint_hist: 10
recovery_interval: 0

# --- Dataset ----------------------------------------------------------------
# NOTE(review): data_dir is an absolute, user-specific path; it has to exist
# on whatever machine consumes this file.
data_dir: /home/luyj/data/cifar-100-python
dataset: torch/cifar100
train_split: train
val_split: validation

# --- Input size and normalization -------------------------------------------
img_size: 32
input_size: null
crop_pct: 1.0
interpolation: bicubic
train_interpolation: bicubic
mean: [0.4914, 0.4822, 0.4465]
std: [0.247, 0.2435, 0.2616]

# --- Batching and data loading ----------------------------------------------
batch_size: 64
val_batch_size: 64
workers: 8
pin_mem: false
no_prefetcher: false
use_multi_epochs_loader: false

# --- Augmentation -----------------------------------------------------------
no_aug: false
aa: rand-m9-n1-mstd0.4-inc1
aug_splits: 0
jsd: false
color_jitter: 0.0
hflip: 0.5
vflip: 0.0
scale: [1.0, 1.0]
ratio: [1.0, 1.0]

# Keys prefixed "re" (presumably random-erasing settings; confirm against the
# training script).
remode: const
reprob: 0.25
recount: 1
resplit: false

# --- Mixup / CutMix ---------------------------------------------------------
mixup: 0.5
mixup_mode: batch
mixup_prob: 1.0
mixup_switch_prob: 0.5
mixup_off_epoch: 200
cutmix: 0.5
cutmix_minmax: null

# --- Drop rates and smoothing -----------------------------------------------
drop: 0.0
drop_block: null
drop_connect: null
drop_path: null
smoothing: 0.01

# --- Batch-norm keys --------------------------------------------------------
bn_eps: null
bn_momentum: null
bn_tf: false
dist_bn: ''
split_bn: false
sync_bn: false

# --- Optimizer --------------------------------------------------------------
opt: adamw
opt_betas: null
opt_eps: null
momentum: 0.9
weight_decay: 0.06
clip_grad: null
clip_mode: norm

# --- Learning-rate schedule -------------------------------------------------
sched: cosine
lr: 0.005
min_lr: 1.0e-07
warmup_lr: 0.0001
warmup_epochs: 20
epochs: 300
epoch_repeats: 0.0
cooldown_epochs: 10
patience_epochs: 10
decay_epochs: 30
decay_rate: 0.1
lr_cycle_limit: 1
lr_cycle_mul: 1.0
lr_noise: null
lr_noise_pct: 0.67
lr_noise_std: 1.0

# --- Model EMA --------------------------------------------------------------
model_ema: false
model_ema_decay: 0.9998
model_ema_force_cpu: false

# --- AMP flags --------------------------------------------------------------
amp: true
apex_amp: false
native_amp: false

# --- Run control, evaluation, logging and output ----------------------------
seed: 2025
local_rank: 0
eval_metric: top1
tta: 0
log_interval: 1000
log_wandb: false
save_images: false
output: ''
experiment: ''
