{
    "_loaded_saveroot": null,
    "accumulation_steps": 4,
    "adw_norm_type": "l21",
    "bypass_type": "mild_pruning_W",
    "dataset_name": "imagenet",
    "delta_init": "ConstantMultipleNorm(1,norm_p=2)",
    "epsilon": 0.000008,
    "eval_batch_size": 64,
    "gamma": "2.5e-4*(1+1/4*t)",
    "init_momentum": false,
    "input_shape": [
        3,
        224,
        224
    ],
    "loss": "categorical_crossentropy",
    "loss_args": {
        "label_smoothing": 0.1
    },
    "metrics": [
        "accuracy",
        "categorical_crossentropy"
    ],
    "mixup_args": {"mixup_preset":"snp"},
    "model_args": {},
    "model_build_verbose": true,
    "model_name": "imagenet_DeiTBase",
    "opt1_epoch": 20,
    "opt1_lr": 0.005,
    "opt1_scheduler_args": {"sched":"cosine"},
    "opt2_lr": 0.005,
    "opt2_scheduler_args": {"milestones":[25,30,35],"gamma":0.1},
    "opt2_max": 40,
    "optimizer_args": {
        "weight_decay": 0.0001,
        "momentum": 0.9
    },
    "optimizer_norm_args": {
        "weight_decay": 0,
        "momentum": 0.9
    },
    "optimizer_bias_args": {
        "weight_decay": 0,
        "momentum": 0.9
    },
    "optimizer_delta_args": {
        "weight_decay": 0
    },
    "optimizer_type": "sgd",
    "output_dims": 1000,
    "prune_epsilon": "C_1",
    "prune_epsilon_args": {"n_components":2},
    "random_seed": 237,
    "save_period_epoch": null,
    "train1_epoch": 0,
    "train1_lr": 0.0001,
    "train3_epoch": 75,
    "train3_lr": 0.005,
    "train3_scheduler_args": {"milestones":[65,70],"gamma":0.1},
    "train_batch_size": 64,
    "workers": 8
}
