{
    "_loaded_saveroot": null,
    "accumulation_steps": 1,
    "adw_norm_type": "l1mean",
    "bypass_type": "mild_pruning_W",
    "dataset_name": "benchmark_cifar100",
    "epsilon": 0.0002,
    "eval_batch_size": 128,
    "gamma": "2e-4*t",
    "git_hash": "8b6f5e60543d88cbe16484369cd34e87e7f5496a",
    "init_momentum": false,
    "input_shape": [
        3,
        32,
        32
    ],
    "loss": "categorical_crossentropy",
    "loss_args": {
        "reduction": "mean"
    },
    "metrics": [
        "accuracy",
        "categorical_crossentropy"
    ],
    "model_args": {},
    "model_build_verbose": true,
    "model_name": "cifar100_BypassVGG19",
    "np_seed": 827,
    "opt1_epoch": 500,
    "opt1_lr": 0.0001,
    "opt2_lr": 0.0001,
    "opt2_max": 2000,
    "optimizer_args": {
        "weight_decay": 0.0005,
        "momentum": 0.9
    },
    "optimizer_delta_args": {
        "weight_decay": 0
    },
    "optimizer_type": "sgd",
    "output_dims": 100,
    "prune_epsilon": "W_GMM",
    "prune_epsilon_args": {
        "n_components": 2
    },
    "random_seed": 237,
    "save_period_epoch": null,
    "torch_seed": 29,
    "train1_epoch": 0,
    "train1_lr": 0.0001,
    "train3_epoch": 2300,
    "train3_lr": 0.0001,
    "train_batch_size": 128
}