{
    "original": {},
    "retraining": {},
    "gd": {
        "training_arguments": {
            "num_train_epochs": 0.1
        }
    },
    "sgd": {
        "training_arguments": {
            "num_train_epochs": 1
        }
    },
    "ga": {
        "training_arguments": {
            "num_train_epochs": 1,
            "learning_rate": 5e-5
        }
    },
    "random_labels": {
        "training_arguments": {
            "num_train_epochs": 1,
            "learning_rate": 1e-5
        }
    },
    "scr_newton": {
        "training_arguments": {
            "num_train_epochs": 0.0001
        },
        "M": 60,
        "num_outer_steps": 20,
        "grad_sample_size": 20,
        "hess_sample_size": 10,
        "num_inner_steps": 3,
        "learning_rate": 0.001
    },
    "scrub": {
        "training_arguments": {
            "num_train_epochs": 1,
            "per_device_train_batch_size": 10
        },
        "kd_T": 4,
        "distill": "kd",
        "msteps": 2,
        "gamma": 0.99,
        "alpha": 0.001,
        "beta": 0,
        "smoothing": 0.0,
        "clip": 0.2,
        "sstart": 10,
        "sgda_batch_size": 128,
        "del_batch_size": 32,
        "sgda_epochs": 1,
        "sgda_learning_rate": 0.0005,
        "lr_decay_epochs": [3,5,9],
        "lr_decay_rate": 0.1,
        "sgda_weight_decay": 5e-4,
        "sgda_momentum": 0.9
    }
}