{"Epoch": 0, "Epoch-Time": 239.03329515457153, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.47000122070312, "Augmented-0.05-Quantile-Accuracy": 96.68999481201172, "Augmented-0.1-Quantile-Accuracy": 97.13999938964844, "Augmented-Accuracy": 98.0742, "Augmented-Loss": 0.20319050607967376, "Clean-Accuracy": 98.25, "Clean-Loss": 0.13825700964927673, "PGD-Accuracy": 0.52, "PGD-Loss": 4.459980114746093}, "Total-Time": 239.03329515457153, "Train": {"Loss": 1.1213170847186336, "avg t": 0.9438527506722344, "plain loss": 0.41980300474520144, "standard loss": 0.3416596777704027}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.58333587646484, "Augmented-0.05-Quantile-Accuracy": 97.36666870117188, "Augmented-0.1-Quantile-Accuracy": 97.63333129882812, "Augmented-Accuracy": 98.54633333333334, "Augmented-Loss": 0.18561800723473232, "Clean-Accuracy": 98.8, "Clean-Loss": 0.12479806081453959, "PGD-Accuracy": 0.4166666666666667, "PGD-Loss": 4.464552675882976}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 1, "Epoch-Time": 203.95857524871826, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.88999938964844, "Augmented-0.05-Quantile-Accuracy": 97.72000122070312, "Augmented-0.1-Quantile-Accuracy": 98.04000091552734, "Augmented-Accuracy": 98.7479, "Augmented-Loss": 0.18177881755924225, "Clean-Accuracy": 98.84, "Clean-Loss": 0.11261270513534546, "PGD-Accuracy": 1.47, "PGD-Loss": 4.464981671142578}, "Total-Time": 442.9918704032898, "Train": {"Loss": 0.9777934188312954, "avg t": 0.9281721116171943, "plain loss": 0.2637621921821879, "standard loss": 0.18330151225019384}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.4000015258789, "Augmented-0.05-Quantile-Accuracy": 98.0999984741211, "Augmented-0.1-Quantile-Accuracy": 98.28333282470703, "Augmented-Accuracy": 98.8335, "Augmented-Loss": 0.17257051164786022, "Clean-Accuracy": 98.9, "Clean-Loss": 0.10698350111643473, "PGD-Accuracy": 1.7666666666666666, "PGD-Loss": 4.449163281758627}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 2, "Epoch-Time": 227.3399612903595, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.5199966430664, "Augmented-0.05-Quantile-Accuracy": 96.83999633789062, "Augmented-0.1-Quantile-Accuracy": 97.27999877929688, "Augmented-Accuracy": 98.2909, "Augmented-Loss": 0.24400159599018098, "Clean-Accuracy": 98.55, "Clean-Loss": 0.1741086398124695, "PGD-Accuracy": 2.0, "PGD-Loss": 5.998168054199219}, "Total-Time": 670.3318316936493, "Train": {"Loss": 0.9617926333038895, "avg t": 0.926034863754555, "plain loss": 0.22841231387103048, "standard loss": 0.15985724708769056}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.19999694824219, "Augmented-0.05-Quantile-Accuracy": 97.3499984741211, "Augmented-0.1-Quantile-Accuracy": 97.66666412353516, "Augmented-Accuracy": 98.45566666666667, "Augmented-Loss": 0.22744331452290217, "Clean-Accuracy": 98.73333333333333, "Clean-Loss": 0.16144019055366515, "PGD-Accuracy": 2.183333333333333, "PGD-Loss": 6.032513951619467}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 3, "Epoch-Time": 241.21174216270447, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.8699951171875, "Augmented-0.05-Quantile-Accuracy": 97.86000061035156, "Augmented-0.1-Quantile-Accuracy": 98.20999908447266, "Augmented-Accuracy": 98.8886, "Augmented-Loss": 0.1085724809858799, "Clean-Accuracy": 99.04, "Clean-Loss": 0.07559287103414536, "PGD-Accuracy": 2.1, "PGD-Loss": 6.90851796875}, "Total-Time": 911.5435738563538, "Train": {"Loss": 0.9549582923959803, "avg t": 0.924938831558934, "plain loss": 0.20057837443881552, "standard loss": 0.14731919537650215}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.69999694824219, "Augmented-0.05-Quantile-Accuracy": 98.3499984741211, "Augmented-0.1-Quantile-Accuracy": 98.53333282470703, "Augmented-Accuracy": 98.941, "Augmented-Loss": 0.10103813583711783, "Clean-Accuracy": 99.03333333333333, "Clean-Loss": 0.07207688454786937, "PGD-Accuracy": 2.4166666666666665, "PGD-Loss": 6.916969599405925}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 4, "Epoch-Time": 241.17919635772705, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.0999984741211, "Augmented-0.05-Quantile-Accuracy": 97.8499984741211, "Augmented-0.1-Quantile-Accuracy": 98.11000061035156, "Augmented-Accuracy": 98.9125, "Augmented-Loss": 0.120588704018116, "Clean-Accuracy": 99.01, "Clean-Loss": 0.09075730106830597, "PGD-Accuracy": 5.13, "PGD-Loss": 6.34272419128418}, "Total-Time": 1152.7227702140808, "Train": {"Loss": 0.9499116776077836, "avg t": 0.9242620219124688, "plain loss": 0.17957455398418298, "standard loss": 0.1319550086370221}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.5999984741211, "Augmented-0.05-Quantile-Accuracy": 98.26666259765625, "Augmented-0.1-Quantile-Accuracy": 98.51666259765625, "Augmented-Accuracy": 98.97833333333334, "Augmented-Loss": 0.11007207670966784, "Clean-Accuracy": 99.06666666666666, "Clean-Loss": 0.0837799077630043, "PGD-Accuracy": 5.25, "PGD-Loss": 6.278943478902181}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 5, "Epoch-Time": 241.33213257789612, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.1199951171875, "Augmented-0.05-Quantile-Accuracy": 97.93999481201172, "Augmented-0.1-Quantile-Accuracy": 98.3699951171875, "Augmented-Accuracy": 98.9476, "Augmented-Loss": 0.140279715010643, "Clean-Accuracy": 99.09, "Clean-Loss": 0.10817413611412048, "PGD-Accuracy": 5.48, "PGD-Loss": 6.7369577575683595}, "Total-Time": 1394.054902791977, "Train": {"Loss": 0.9469121863753708, "avg t": 0.9237421856632939, "plain loss": 0.16681616422158688, "standard loss": 0.12393662680961468}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.54999542236328, "Augmented-0.05-Quantile-Accuracy": 98.29999542236328, "Augmented-0.1-Quantile-Accuracy": 98.48332977294922, "Augmented-Accuracy": 98.97566666666667, "Augmented-Loss": 0.12964646615624428, "Clean-Accuracy": 99.05, "Clean-Loss": 0.09982363899548849, "PGD-Accuracy": 5.5, "PGD-Loss": 6.599804626464843}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 6, "Epoch-Time": 209.13998103141785, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.32999420166016, "Augmented-0.05-Quantile-Accuracy": 98.11000061035156, "Augmented-0.1-Quantile-Accuracy": 98.3699951171875, "Augmented-Accuracy": 99.002, "Augmented-Loss": 0.08857066383314133, "Clean-Accuracy": 99.15, "Clean-Loss": 0.06541236379146576, "PGD-Accuracy": 4.85, "PGD-Loss": 7.665491528320312}, "Total-Time": 1603.1948838233948, "Train": {"Loss": 0.9445861374183937, "avg t": 0.923379982135914, "plain loss": 0.15865948469727134, "standard loss": 0.11892938325581727}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.69999694824219, "Augmented-0.05-Quantile-Accuracy": 98.4000015258789, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.056, "Augmented-Loss": 0.08537732235570748, "Clean-Accuracy": 99.11666666666666, "Clean-Loss": 0.0653796684940656, "PGD-Accuracy": 4.816666666666666, "PGD-Loss": 7.571072306315104}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 7, "Epoch-Time": 214.61931705474854, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.29000091552734, "Augmented-0.05-Quantile-Accuracy": 97.95999908447266, "Augmented-0.1-Quantile-Accuracy": 98.29999542236328, "Augmented-Accuracy": 98.9897, "Augmented-Loss": 0.07980783574604988, "Clean-Accuracy": 99.11, "Clean-Loss": 0.06251920506954194, "PGD-Accuracy": 4.89, "PGD-Loss": 7.643169924926758}, "Total-Time": 1817.8142008781433, "Train": {"Loss": 0.94321704949273, "avg t": 0.9231416854151973, "plain loss": 0.14765582744457112, "standard loss": 0.109606129569036}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.69999694824219, "Augmented-0.05-Quantile-Accuracy": 98.4000015258789, "Augmented-0.1-Quantile-Accuracy": 98.71666717529297, "Augmented-Accuracy": 99.08316666666667, "Augmented-Loss": 0.07488301510194938, "Clean-Accuracy": 99.13333333333334, "Clean-Loss": 0.06039453308780988, "PGD-Accuracy": 5.266666666666667, "PGD-Loss": 7.574060221354166}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 8, "Epoch-Time": 241.34305930137634, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.97000122070312, "Augmented-0.05-Quantile-Accuracy": 98.02999877929688, "Augmented-0.1-Quantile-Accuracy": 98.25999450683594, "Augmented-Accuracy": 98.932, "Augmented-Loss": 0.13423488643932344, "Clean-Accuracy": 98.98, "Clean-Loss": 0.09897055430412292, "PGD-Accuracy": 11.1, "PGD-Loss": 6.469717953491211}, "Total-Time": 2059.1572601795197, "Train": {"Loss": 0.9418547926655522, "avg t": 0.9228775393344738, "plain loss": 0.13726251381768123, "standard loss": 0.10191857750548257}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.6500015258789, "Augmented-0.05-Quantile-Accuracy": 98.31666564941406, "Augmented-0.1-Quantile-Accuracy": 98.61666870117188, "Augmented-Accuracy": 99.0085, "Augmented-Loss": 0.12221801956017812, "Clean-Accuracy": 99.05, "Clean-Loss": 0.09118959059317906, "PGD-Accuracy": 10.8, "PGD-Loss": 6.414572545369466}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 9, "Epoch-Time": 241.42344617843628, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.32999420166016, "Augmented-0.05-Quantile-Accuracy": 98.04000091552734, "Augmented-0.1-Quantile-Accuracy": 98.31999969482422, "Augmented-Accuracy": 98.9665, "Augmented-Loss": 0.07364146750700473, "Clean-Accuracy": 99.04, "Clean-Loss": 0.05763043994903565, "PGD-Accuracy": 3.22, "PGD-Loss": 8.470935247802734}, "Total-Time": 2300.580706357956, "Train": {"Loss": 0.941213198573501, "avg t": 0.9227553694866322, "plain loss": 0.13338378764964925, "standard loss": 0.09947964856138936}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.93333435058594, "Augmented-0.05-Quantile-Accuracy": 98.44999694824219, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.12533333333333, "Augmented-Loss": 0.06836461757183075, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.0549897787074248, "PGD-Accuracy": 3.466666666666667, "PGD-Loss": 8.334766301472982}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 10, "Epoch-Time": 241.29705476760864, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.30999755859375, "Augmented-0.05-Quantile-Accuracy": 98.02999877929688, "Augmented-0.1-Quantile-Accuracy": 98.29000091552734, "Augmented-Accuracy": 98.9825, "Augmented-Loss": 0.0766401893620491, "Clean-Accuracy": 99.11, "Clean-Loss": 0.05693345335721969, "PGD-Accuracy": 3.72, "PGD-Loss": 8.639303387451172}, "Total-Time": 2541.8777611255646, "Train": {"Loss": 0.9404589783350626, "avg t": 0.9226195017673351, "plain loss": 0.12853736222585055, "standard loss": 0.0949098810641854}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.04999542236328, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.66666412353516, "Augmented-Accuracy": 99.035, "Augmented-Loss": 0.07390323124080897, "Clean-Accuracy": 99.11666666666666, "Clean-Loss": 0.05799202361702919, "PGD-Accuracy": 3.9166666666666665, "PGD-Loss": 8.641291585286458}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 11, "Epoch-Time": 239.52335596084595, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.08999633789062, "Augmented-0.05-Quantile-Accuracy": 97.89999389648438, "Augmented-0.1-Quantile-Accuracy": 98.22000122070312, "Augmented-Accuracy": 98.94, "Augmented-Loss": 0.10946493741178513, "Clean-Accuracy": 99.04, "Clean-Loss": 0.08523751242160797, "PGD-Accuracy": 12.32, "PGD-Loss": 7.053729855346679}, "Total-Time": 2781.4011170864105, "Train": {"Loss": 0.9402412228937502, "avg t": 0.9225759546138622, "plain loss": 0.12838432352984394, "standard loss": 0.09563894979379796}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.56666564941406, "Augmented-0.05-Quantile-Accuracy": 98.29999542236328, "Augmented-0.1-Quantile-Accuracy": 98.51666259765625, "Augmented-Accuracy": 98.99783333333333, "Augmented-Loss": 0.10269745498677095, "Clean-Accuracy": 99.1, "Clean-Loss": 0.08152413417895635, "PGD-Accuracy": 12.783333333333333, "PGD-Loss": 6.927281865437825}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 12, "Epoch-Time": 202.10785245895386, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.25999450683594, "Augmented-0.05-Quantile-Accuracy": 98.05999755859375, "Augmented-0.1-Quantile-Accuracy": 98.3499984741211, "Augmented-Accuracy": 98.986, "Augmented-Loss": 0.07930901254367828, "Clean-Accuracy": 99.07, "Clean-Loss": 0.06690065549612045, "PGD-Accuracy": 3.89, "PGD-Loss": 8.936483068847656}, "Total-Time": 2983.5089695453644, "Train": {"Loss": 0.9398915399268821, "avg t": 0.922490033255683, "plain loss": 0.12598109165827437, "standard loss": 0.10165326684934121}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.96666717529297, "Augmented-0.05-Quantile-Accuracy": 98.46666717529297, "Augmented-0.1-Quantile-Accuracy": 98.73332977294922, "Augmented-Accuracy": 99.06366666666666, "Augmented-Loss": 0.07532981908122699, "Clean-Accuracy": 99.11666666666666, "Clean-Loss": 0.06485878556966782, "PGD-Accuracy": 3.7, "PGD-Loss": 8.863058008829753}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 13, "Epoch-Time": 228.65731954574585, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.05999755859375, "Augmented-0.05-Quantile-Accuracy": 98.0199966430664, "Augmented-0.1-Quantile-Accuracy": 98.31999969482422, "Augmented-Accuracy": 99.0012, "Augmented-Loss": 0.09829093023085594, "Clean-Accuracy": 99.08, "Clean-Loss": 0.07211927881240844, "PGD-Accuracy": 10.31, "PGD-Loss": 6.726900970458984}, "Total-Time": 3212.1662890911102, "Train": {"Loss": 0.9398870420279326, "avg t": 0.9224742954572042, "plain loss": 0.12187289600725525, "standard loss": 0.09937137605967344}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.69999694824219, "Augmented-0.05-Quantile-Accuracy": 98.33333587646484, "Augmented-0.1-Quantile-Accuracy": 98.56666564941406, "Augmented-Accuracy": 99.01916666666666, "Augmented-Loss": 0.09258039843539397, "Clean-Accuracy": 99.05, "Clean-Loss": 0.06995491518576939, "PGD-Accuracy": 10.1, "PGD-Loss": 6.603432614644369}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 14, "Epoch-Time": 241.4134418964386, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.3699951171875, "Augmented-0.05-Quantile-Accuracy": 98.13999938964844, "Augmented-0.1-Quantile-Accuracy": 98.48999786376953, "Augmented-Accuracy": 99.0469, "Augmented-Loss": 0.08861167699837684, "Clean-Accuracy": 99.15, "Clean-Loss": 0.07167426207065582, "PGD-Accuracy": 9.63, "PGD-Loss": 7.632462518310547}, "Total-Time": 3453.579730987549, "Train": {"Loss": 0.9396551839687206, "avg t": 0.9224146896291662, "plain loss": 0.12339764796009779, "standard loss": 0.09721030391145635}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.78333282470703, "Augmented-0.05-Quantile-Accuracy": 98.48332977294922, "Augmented-0.1-Quantile-Accuracy": 98.71666717529297, "Augmented-Accuracy": 99.11333333333333, "Augmented-Loss": 0.08238044920166333, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.06791580359141032, "PGD-Accuracy": 9.9, "PGD-Loss": 7.513287556966146}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 15, "Epoch-Time": 241.25288677215576, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.5, "Augmented-0.05-Quantile-Accuracy": 98.18000030517578, "Augmented-0.1-Quantile-Accuracy": 98.48999786376953, "Augmented-Accuracy": 99.0622, "Augmented-Loss": 0.0648999345742464, "Clean-Accuracy": 99.14, "Clean-Loss": 0.053434787154197694, "PGD-Accuracy": 6.06, "PGD-Loss": 8.667275915527343}, "Total-Time": 3694.8326177597046, "Train": {"Loss": 0.9395085070927938, "avg t": 0.9223862046135797, "plain loss": 0.12335089493327664, "standard loss": 0.09927483344188442}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.96666717529297, "Augmented-0.05-Quantile-Accuracy": 98.54999542236328, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.1035, "Augmented-Loss": 0.06376084455112616, "Clean-Accuracy": 99.11666666666666, "Clean-Loss": 0.05432941663265228, "PGD-Accuracy": 7.416666666666667, "PGD-Loss": 8.584369176228842}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 16, "Epoch-Time": 241.53422665596008, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.6199951171875, "Augmented-0.05-Quantile-Accuracy": 97.6199951171875, "Augmented-0.1-Quantile-Accuracy": 97.90999603271484, "Augmented-Accuracy": 98.7408, "Augmented-Loss": 0.09260331256389617, "Clean-Accuracy": 98.82, "Clean-Loss": 0.07201744620800019, "PGD-Accuracy": 6.89, "PGD-Loss": 8.7494423828125}, "Total-Time": 3936.3668444156647, "Train": {"Loss": 0.9392465898195903, "avg t": 0.922331743116732, "plain loss": 0.11510415739483296, "standard loss": 0.09208822237120734}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.1500015258789, "Augmented-0.05-Quantile-Accuracy": 97.81666564941406, "Augmented-0.1-Quantile-Accuracy": 98.08333587646484, "Augmented-Accuracy": 98.77833333333334, "Augmented-Loss": 0.08823814278622469, "Clean-Accuracy": 98.73333333333333, "Clean-Loss": 0.0706967859963576, "PGD-Accuracy": 6.183333333333334, "PGD-Loss": 8.699230127970377}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 17, "Epoch-Time": 206.62734484672546, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.23999786376953, "Augmented-0.05-Quantile-Accuracy": 98.0999984741211, "Augmented-0.1-Quantile-Accuracy": 98.37999725341797, "Augmented-Accuracy": 99.0228, "Augmented-Loss": 0.11127120015645027, "Clean-Accuracy": 99.14, "Clean-Loss": 0.09171957242488861, "PGD-Accuracy": 13.65, "PGD-Loss": 6.85119469909668}, "Total-Time": 4142.99418926239, "Train": {"Loss": 0.939159024503496, "avg t": 0.9223186419451678, "plain loss": 0.11633385053210789, "standard loss": 0.09447237851443115}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.93333435058594, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.73332977294922, "Augmented-Accuracy": 99.10816666666666, "Augmented-Loss": 0.1026202071126302, "Clean-Accuracy": 99.15, "Clean-Loss": 0.08522281118233999, "PGD-Accuracy": 13.833333333333334, "PGD-Loss": 6.740117332458496}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 18, "Epoch-Time": 216.8325321674347, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.41999816894531, "Augmented-0.05-Quantile-Accuracy": 98.19999694824219, "Augmented-0.1-Quantile-Accuracy": 98.45999908447266, "Augmented-Accuracy": 99.0724, "Augmented-Loss": 0.08857533549642563, "Clean-Accuracy": 99.16, "Clean-Loss": 0.06937989401817322, "PGD-Accuracy": 8.98, "PGD-Loss": 7.663324453735352}, "Total-Time": 4359.826721429825, "Train": {"Loss": 0.9390669786135356, "avg t": 0.9222932914804529, "plain loss": 0.11664579934014226, "standard loss": 0.09435567952968456}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.86666870117188, "Augmented-0.05-Quantile-Accuracy": 98.44999694824219, "Augmented-0.1-Quantile-Accuracy": 98.61666870117188, "Augmented-Accuracy": 99.12616666666666, "Augmented-Loss": 0.08454836216052374, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.06796465851863226, "PGD-Accuracy": 9.25, "PGD-Loss": 7.576590108235677}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 19, "Epoch-Time": 241.20165705680847, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.40999603271484, "Augmented-0.05-Quantile-Accuracy": 98.23999786376953, "Augmented-0.1-Quantile-Accuracy": 98.47999572753906, "Augmented-Accuracy": 99.0442, "Augmented-Loss": 0.0871795448167324, "Clean-Accuracy": 99.16, "Clean-Loss": 0.0683232612490654, "PGD-Accuracy": 10.34, "PGD-Loss": 6.842151748657226}, "Total-Time": 4601.028378486633, "Train": {"Loss": 0.9389879009458754, "avg t": 0.9222685831564444, "plain loss": 0.11508894632833981, "standard loss": 0.09041140437346917}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.71666717529297, "Augmented-0.05-Quantile-Accuracy": 98.36666870117188, "Augmented-0.1-Quantile-Accuracy": 98.51666259765625, "Augmented-Accuracy": 99.02616666666667, "Augmented-Loss": 0.08314489974300067, "Clean-Accuracy": 99.15, "Clean-Loss": 0.06673846245805422, "PGD-Accuracy": 10.266666666666667, "PGD-Loss": 6.814341023763021}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 20, "Epoch-Time": 241.4107768535614, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.5, "Augmented-0.05-Quantile-Accuracy": 98.32999420166016, "Augmented-0.1-Quantile-Accuracy": 98.50999450683594, "Augmented-Accuracy": 99.0687, "Augmented-Loss": 0.08349402162265777, "Clean-Accuracy": 99.14, "Clean-Loss": 0.07020365628004074, "PGD-Accuracy": 8.36, "PGD-Loss": 7.437487313842773}, "Total-Time": 4842.439155340195, "Train": {"Loss": 0.9389593815273709, "avg t": 0.9222679894235399, "plain loss": 0.11110129362035684, "standard loss": 0.09099232172524488}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.94999694824219, "Augmented-0.05-Quantile-Accuracy": 98.46666717529297, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.10666666666667, "Augmented-Loss": 0.0790270218706131, "Clean-Accuracy": 99.16666666666667, "Clean-Loss": 0.06752076362570127, "PGD-Accuracy": 8.816666666666666, "PGD-Loss": 7.414130381266276}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 21, "Epoch-Time": 241.1717128753662, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.50999450683594, "Augmented-0.05-Quantile-Accuracy": 98.19999694824219, "Augmented-0.1-Quantile-Accuracy": 98.5, "Augmented-Accuracy": 99.0882, "Augmented-Loss": 0.08861516533112526, "Clean-Accuracy": 99.18, "Clean-Loss": 0.07013919370174408, "PGD-Accuracy": 8.99, "PGD-Loss": 8.264518991088867}, "Total-Time": 5083.610868215561, "Train": {"Loss": 0.9390849880289148, "avg t": 0.9222801261654606, "plain loss": 0.11384100396544837, "standard loss": 0.09622871398705023}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.91666412353516, "Augmented-0.05-Quantile-Accuracy": 98.51666259765625, "Augmented-0.1-Quantile-Accuracy": 98.68333435058594, "Augmented-Accuracy": 99.1545, "Augmented-Loss": 0.08446871649066608, "Clean-Accuracy": 99.3, "Clean-Loss": 0.06805676968892416, "PGD-Accuracy": 8.666666666666666, "PGD-Loss": 8.238925196329753}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 22, "Epoch-Time": 238.7939374446869, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.19999694824219, "Augmented-0.05-Quantile-Accuracy": 97.93999481201172, "Augmented-0.1-Quantile-Accuracy": 98.32999420166016, "Augmented-Accuracy": 98.9183, "Augmented-Loss": 0.08064165564656257, "Clean-Accuracy": 98.97, "Clean-Loss": 0.06126517325639725, "PGD-Accuracy": 7.92, "PGD-Loss": 6.9697468475341795}, "Total-Time": 5322.404805660248, "Train": {"Loss": 0.9387431230368437, "avg t": 0.9222299230010421, "plain loss": 0.10790418820027972, "standard loss": 0.08284755532167576}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.63333129882812, "Augmented-0.05-Quantile-Accuracy": 98.28333282470703, "Augmented-0.1-Quantile-Accuracy": 98.44999694824219, "Augmented-Accuracy": 98.99783333333333, "Augmented-Loss": 0.07616319141189257, "Clean-Accuracy": 99.05, "Clean-Loss": 0.059440857350826264, "PGD-Accuracy": 8.083333333333334, "PGD-Loss": 6.769102083841959}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 23, "Epoch-Time": 201.0979347229004, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.41999816894531, "Augmented-0.05-Quantile-Accuracy": 98.16999816894531, "Augmented-0.1-Quantile-Accuracy": 98.3699951171875, "Augmented-Accuracy": 99.0481, "Augmented-Loss": 0.07702991751170159, "Clean-Accuracy": 99.2, "Clean-Loss": 0.05772026681900024, "PGD-Accuracy": 4.58, "PGD-Loss": 8.728483544921875}, "Total-Time": 5523.502740383148, "Train": {"Loss": 0.9387805117324547, "avg t": 0.9222228326797486, "plain loss": 0.11129172501387427, "standard loss": 0.08409571591130009}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.8499984741211, "Augmented-0.05-Quantile-Accuracy": 98.43333435058594, "Augmented-0.1-Quantile-Accuracy": 98.68333435058594, "Augmented-Accuracy": 99.06883333333333, "Augmented-Loss": 0.0740345293277502, "Clean-Accuracy": 99.13333333333334, "Clean-Loss": 0.057341255267461144, "PGD-Accuracy": 4.633333333333334, "PGD-Loss": 8.592876124064128}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 24, "Epoch-Time": 230.20753455162048, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.11000061035156, "Augmented-0.05-Quantile-Accuracy": 97.94999694824219, "Augmented-0.1-Quantile-Accuracy": 98.27999877929688, "Augmented-Accuracy": 98.9116, "Augmented-Loss": 0.10550987478637695, "Clean-Accuracy": 98.96, "Clean-Loss": 0.08310305626392364, "PGD-Accuracy": 13.06, "PGD-Loss": 6.303566186523438}, "Total-Time": 5753.710274934769, "Train": {"Loss": 0.9387291302504363, "avg t": 0.9222152459533126, "plain loss": 0.10901704148539772, "standard loss": 0.08066345107996906}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.68333435058594, "Augmented-0.05-Quantile-Accuracy": 98.25, "Augmented-0.1-Quantile-Accuracy": 98.46666717529297, "Augmented-Accuracy": 99.00216666666667, "Augmented-Loss": 0.09892632361789544, "Clean-Accuracy": 99.11666666666666, "Clean-Loss": 0.07911829535166423, "PGD-Accuracy": 13.65, "PGD-Loss": 6.171603815714518}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 25, "Epoch-Time": 241.1881992816925, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.56999969482422, "Augmented-0.05-Quantile-Accuracy": 98.20999908447266, "Augmented-0.1-Quantile-Accuracy": 98.44999694824219, "Augmented-Accuracy": 99.0987, "Augmented-Loss": 0.07302026276016235, "Clean-Accuracy": 99.21, "Clean-Loss": 0.057206352841854095, "PGD-Accuracy": 5.07, "PGD-Loss": 8.522790740966796}, "Total-Time": 5994.898474216461, "Train": {"Loss": 0.93875094710456, "avg t": 0.9222139449825993, "plain loss": 0.10984555962527237, "standard loss": 0.08559870104105384}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0999984741211, "Augmented-0.05-Quantile-Accuracy": 98.53333282470703, "Augmented-0.1-Quantile-Accuracy": 98.71666717529297, "Augmented-Accuracy": 99.12616666666666, "Augmented-Loss": 0.0692556767074267, "Clean-Accuracy": 99.2, "Clean-Loss": 0.055676091839869817, "PGD-Accuracy": 5.766666666666667, "PGD-Loss": 8.396088821411134}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 26, "Epoch-Time": 241.22238159179688, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.44999694824219, "Augmented-0.05-Quantile-Accuracy": 98.18999481201172, "Augmented-0.1-Quantile-Accuracy": 98.47999572753906, "Augmented-Accuracy": 99.093, "Augmented-Loss": 0.09394859969210624, "Clean-Accuracy": 99.18, "Clean-Loss": 0.06891120674610138, "PGD-Accuracy": 10.33, "PGD-Loss": 7.323901669311524}, "Total-Time": 6236.120855808258, "Train": {"Loss": 0.9388154414848046, "avg t": 0.9222341847066526, "plain loss": 0.11228607257030614, "standard loss": 0.08205079020063083}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.01666259765625, "Augmented-0.05-Quantile-Accuracy": 98.48332977294922, "Augmented-0.1-Quantile-Accuracy": 98.66666412353516, "Augmented-Accuracy": 99.129, "Augmented-Loss": 0.08757813403725624, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.0658479714691639, "PGD-Accuracy": 10.566666666666666, "PGD-Loss": 7.265032338460286}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 27, "Epoch-Time": 241.18104076385498, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.41999816894531, "Augmented-0.05-Quantile-Accuracy": 98.16999816894531, "Augmented-0.1-Quantile-Accuracy": 98.41999816894531, "Augmented-Accuracy": 99.0465, "Augmented-Loss": 0.10764727552604675, "Clean-Accuracy": 99.15, "Clean-Loss": 0.08647339949607849, "PGD-Accuracy": 13.81, "PGD-Loss": 6.277953387451172}, "Total-Time": 6477.301896572113, "Train": {"Loss": 0.9386862835530881, "avg t": 0.9222056663301256, "plain loss": 0.11310871359860453, "standard loss": 0.08732130671872033}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.9000015258789, "Augmented-0.05-Quantile-Accuracy": 98.54999542236328, "Augmented-0.1-Quantile-Accuracy": 98.76666259765625, "Augmented-Accuracy": 99.142, "Augmented-Loss": 0.09851726792693138, "Clean-Accuracy": 99.16666666666667, "Clean-Loss": 0.07958978547652562, "PGD-Accuracy": 14.683333333333334, "PGD-Loss": 6.210713628133138}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 28, "Epoch-Time": 204.76540684700012, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.37999725341797, "Augmented-0.05-Quantile-Accuracy": 98.13999938964844, "Augmented-0.1-Quantile-Accuracy": 98.40999603271484, "Augmented-Accuracy": 99.0165, "Augmented-Loss": 0.09612643516778946, "Clean-Accuracy": 99.11, "Clean-Loss": 0.07643065123558045, "PGD-Accuracy": 8.57, "PGD-Loss": 7.037353005981445}, "Total-Time": 6682.067303419113, "Train": {"Loss": 0.9385986972738195, "avg t": 0.9221897677138999, "plain loss": 0.10876969250573049, "standard loss": 0.08748006319558178}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.03333282470703, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.68333435058594, "Augmented-Accuracy": 99.125, "Augmented-Loss": 0.0897481528155009, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.07210327158371607, "PGD-Accuracy": 9.366666666666667, "PGD-Loss": 6.922649353027344}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 29, "Epoch-Time": 218.73866724967957, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.69999694824219, "Augmented-0.05-Quantile-Accuracy": 98.25999450683594, "Augmented-0.1-Quantile-Accuracy": 98.47999572753906, "Augmented-Accuracy": 99.1038, "Augmented-Loss": 0.06762763770282268, "Clean-Accuracy": 99.12, "Clean-Loss": 0.060384349954128266, "PGD-Accuracy": 3.73, "PGD-Loss": 8.47435346069336}, "Total-Time": 6900.805970668793, "Train": {"Loss": 0.9386194439817358, "avg t": 0.9221884662663495, "plain loss": 0.10853980097770695, "standard loss": 0.0887202530503273}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0, "Augmented-0.05-Quantile-Accuracy": 98.54999542236328, "Augmented-0.1-Quantile-Accuracy": 98.73332977294922, "Augmented-Accuracy": 99.143, "Augmented-Loss": 0.06451467574775219, "Clean-Accuracy": 99.15, "Clean-Loss": 0.058082408477862675, "PGD-Accuracy": 3.716666666666667, "PGD-Loss": 8.339780415852864}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 30, "Epoch-Time": 241.22998785972595, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.5199966430664, "Augmented-0.05-Quantile-Accuracy": 98.15999603271484, "Augmented-0.1-Quantile-Accuracy": 98.38999938964844, "Augmented-Accuracy": 99.03, "Augmented-Loss": 0.09217356607437134, "Clean-Accuracy": 99.11, "Clean-Loss": 0.06901859838962555, "PGD-Accuracy": 11.92, "PGD-Loss": 7.02951100769043}, "Total-Time": 7142.035958528519, "Train": {"Loss": 0.9387147053082784, "avg t": 0.9221976435802601, "plain loss": 0.10902255215468226, "standard loss": 0.08734578385176482}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.03333282470703, "Augmented-0.05-Quantile-Accuracy": 98.56666564941406, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.13466666666666, "Augmented-Loss": 0.08467290451625983, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.06439832947651546, "PGD-Accuracy": 11.45, "PGD-Loss": 7.054815984090169}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 31, "Epoch-Time": 241.29436087608337, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.62999725341797, "Augmented-0.05-Quantile-Accuracy": 98.25999450683594, "Augmented-0.1-Quantile-Accuracy": 98.54000091552734, "Augmented-Accuracy": 99.121, "Augmented-Loss": 0.07413407611894608, "Clean-Accuracy": 99.21, "Clean-Loss": 0.05929060989618301, "PGD-Accuracy": 4.87, "PGD-Loss": 7.906742028808594}, "Total-Time": 7383.330319404602, "Train": {"Loss": 0.9385343882242838, "avg t": 0.9221656703419155, "plain loss": 0.10858947316275705, "standard loss": 0.08556394011003}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.08333587646484, "Augmented-0.05-Quantile-Accuracy": 98.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.76666259765625, "Augmented-Accuracy": 99.1675, "Augmented-Loss": 0.06945728126307328, "Clean-Accuracy": 99.2, "Clean-Loss": 0.056696721742550533, "PGD-Accuracy": 5.966666666666667, "PGD-Loss": 7.711247467041016}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 32, "Epoch-Time": 241.1218991279602, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.52999877929688, "Augmented-0.05-Quantile-Accuracy": 98.18000030517578, "Augmented-0.1-Quantile-Accuracy": 98.47000122070312, "Augmented-Accuracy": 99.0783, "Augmented-Loss": 0.0764836107776165, "Clean-Accuracy": 99.11, "Clean-Loss": 0.06175743968486786, "PGD-Accuracy": 2.93, "PGD-Loss": 8.011641082763672}, "Total-Time": 7624.452218532562, "Train": {"Loss": 0.9385737094349331, "avg t": 0.9221723579477381, "plain loss": 0.1067806207762824, "standard loss": 0.08482892853683896}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.9000015258789, "Augmented-0.05-Quantile-Accuracy": 98.38333129882812, "Augmented-0.1-Quantile-Accuracy": 98.61666870117188, "Augmented-Accuracy": 99.11633333333333, "Augmented-Loss": 0.07112715053876241, "Clean-Accuracy": 99.15, "Clean-Loss": 0.05862768921256065, "PGD-Accuracy": 3.2666666666666666, "PGD-Loss": 7.873251825968424}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 33, "Epoch-Time": 236.54335641860962, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.73999786376953, "Augmented-0.05-Quantile-Accuracy": 98.27999877929688, "Augmented-0.1-Quantile-Accuracy": 98.5199966430664, "Augmented-Accuracy": 99.1056, "Augmented-Loss": 0.07438237858223914, "Clean-Accuracy": 99.14, "Clean-Loss": 0.0571863273024559, "PGD-Accuracy": 5.39, "PGD-Loss": 7.7366810821533205}, "Total-Time": 7860.995574951172, "Train": {"Loss": 0.938588892088996, "avg t": 0.9221814874013265, "plain loss": 0.10655541090788667, "standard loss": 0.07988727658766287}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.08333587646484, "Augmented-0.05-Quantile-Accuracy": 98.61666870117188, "Augmented-0.1-Quantile-Accuracy": 98.76666259765625, "Augmented-Accuracy": 99.16183333333333, "Augmented-Loss": 0.07062517900248369, "Clean-Accuracy": 99.2, "Clean-Loss": 0.05543793172637622, "PGD-Accuracy": 5.866666666666666, "PGD-Loss": 7.673545918782552}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 34, "Epoch-Time": 202.35085010528564, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.68999481201172, "Augmented-0.05-Quantile-Accuracy": 98.29999542236328, "Augmented-0.1-Quantile-Accuracy": 98.5, "Augmented-Accuracy": 99.1222, "Augmented-Loss": 0.07505731151521206, "Clean-Accuracy": 99.19, "Clean-Loss": 0.058481947445869445, "PGD-Accuracy": 5.66, "PGD-Loss": 7.365194436645508}, "Total-Time": 8063.3464250564575, "Train": {"Loss": 0.9385212805182845, "avg t": 0.9221616367410731, "plain loss": 0.10544469986668327, "standard loss": 0.08141864820983674}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.16666412353516, "Augmented-0.05-Quantile-Accuracy": 98.63333129882812, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.16633333333333, "Augmented-Loss": 0.06978057740052541, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.05544043815135956, "PGD-Accuracy": 6.266666666666667, "PGD-Loss": 7.342965799967448}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 35, "Epoch-Time": 231.80716490745544, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.77999877929688, "Augmented-0.05-Quantile-Accuracy": 98.33999633789062, "Augmented-0.1-Quantile-Accuracy": 98.57999420166016, "Augmented-Accuracy": 99.1543, "Augmented-Loss": 0.06523139632308483, "Clean-Accuracy": 99.28, "Clean-Loss": 0.05303081089258194, "PGD-Accuracy": 2.62, "PGD-Loss": 8.865813433837891}, "Total-Time": 8295.153589963913, "Train": {"Loss": 0.9385862772906268, "avg t": 0.9221657193678396, "plain loss": 0.10908681069303447, "standard loss": 0.08615350947335915}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.13333129882812, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.83333587646484, "Augmented-Accuracy": 99.18783333333333, "Augmented-Loss": 0.06143830383112033, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.051160139779249825, "PGD-Accuracy": 2.9166666666666665, "PGD-Loss": 8.84834230041504}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 36, "Epoch-Time": 241.23515701293945, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.6199951171875, "Augmented-0.05-Quantile-Accuracy": 98.30999755859375, "Augmented-0.1-Quantile-Accuracy": 98.54000091552734, "Augmented-Accuracy": 99.1296, "Augmented-Loss": 0.09256746496677398, "Clean-Accuracy": 99.23, "Clean-Loss": 0.07362631573677063, "PGD-Accuracy": 6.95, "PGD-Loss": 7.125388635253906}, "Total-Time": 8536.388746976852, "Train": {"Loss": 0.9384610312073319, "avg t": 0.9221473463729576, "plain loss": 0.1059459533726728, "standard loss": 0.08335436181668882}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.88333129882812, "Augmented-0.05-Quantile-Accuracy": 98.6500015258789, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.132, "Augmented-Loss": 0.08657641230066618, "Clean-Accuracy": 99.2, "Clean-Loss": 0.06979852344592412, "PGD-Accuracy": 6.85, "PGD-Loss": 7.05494004313151}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 37, "Epoch-Time": 241.3237247467041, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.54000091552734, "Augmented-0.05-Quantile-Accuracy": 98.2699966430664, "Augmented-0.1-Quantile-Accuracy": 98.57999420166016, "Augmented-Accuracy": 99.0754, "Augmented-Loss": 0.06737288104820252, "Clean-Accuracy": 99.09, "Clean-Loss": 0.05436955908536911, "PGD-Accuracy": 2.17, "PGD-Loss": 8.267681970214843}, "Total-Time": 8777.712471723557, "Train": {"Loss": 0.9384442558641787, "avg t": 0.9221456258208663, "plain loss": 0.10511097740597185, "standard loss": 0.08327914463590692}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0, "Augmented-0.05-Quantile-Accuracy": 98.56666564941406, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.104, "Augmented-Loss": 0.06512501077761253, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.05402949906388919, "PGD-Accuracy": 2.6, "PGD-Loss": 8.05478667195638}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 38, "Epoch-Time": 240.96658992767334, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.72000122070312, "Augmented-0.05-Quantile-Accuracy": 98.33999633789062, "Augmented-0.1-Quantile-Accuracy": 98.57999420166016, "Augmented-Accuracy": 99.1426, "Augmented-Loss": 0.08735152254080772, "Clean-Accuracy": 99.23, "Clean-Loss": 0.06323379167318344, "PGD-Accuracy": 8.1, "PGD-Loss": 7.259441445922851}, "Total-Time": 9018.67906165123, "Train": {"Loss": 0.9384188543425666, "avg t": 0.9221418963891489, "plain loss": 0.10250117517400682, "standard loss": 0.07868334856298234}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.18333435058594, "Augmented-0.05-Quantile-Accuracy": 98.68333435058594, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.1725, "Augmented-Loss": 0.08247540637870629, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.06115504561861356, "PGD-Accuracy": 8.833333333333334, "PGD-Loss": 7.1670706075032555}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 39, "Epoch-Time": 206.10409116744995, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.68999481201172, "Augmented-0.05-Quantile-Accuracy": 98.33999633789062, "Augmented-0.1-Quantile-Accuracy": 98.52999877929688, "Augmented-Accuracy": 99.1122, "Augmented-Loss": 0.08128841429781913, "Clean-Accuracy": 99.12, "Clean-Loss": 0.0660798591375351, "PGD-Accuracy": 5.84, "PGD-Loss": 7.35775855102539}, "Total-Time": 9224.78315281868, "Train": {"Loss": 0.9384595908412227, "avg t": 0.9221453694944028, "plain loss": 0.10731175177009013, "standard loss": 0.08287220877188223}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.11666870117188, "Augmented-0.05-Quantile-Accuracy": 98.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.68333435058594, "Augmented-Accuracy": 99.16333333333333, "Augmented-Loss": 0.0764721600941817, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.0626509530643622, "PGD-Accuracy": 6.166666666666667, "PGD-Loss": 7.2707669525146486}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 40, "Epoch-Time": 219.17434906959534, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.62999725341797, "Augmented-0.05-Quantile-Accuracy": 98.37999725341797, "Augmented-0.1-Quantile-Accuracy": 98.62999725341797, "Augmented-Accuracy": 99.1183, "Augmented-Loss": 0.08329269646739959, "Clean-Accuracy": 99.21, "Clean-Loss": 0.06809019575119019, "PGD-Accuracy": 5.78, "PGD-Loss": 7.49159499206543}, "Total-Time": 9443.957501888275, "Train": {"Loss": 0.9384778882485849, "avg t": 0.9221408997641669, "plain loss": 0.10385401815131867, "standard loss": 0.08422494907953121}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.93333435058594, "Augmented-0.05-Quantile-Accuracy": 98.51666259765625, "Augmented-0.1-Quantile-Accuracy": 98.68333435058594, "Augmented-Accuracy": 99.17883333333333, "Augmented-Loss": 0.07805634515364965, "Clean-Accuracy": 99.3, "Clean-Loss": 0.06426020193099975, "PGD-Accuracy": 5.983333333333333, "PGD-Loss": 7.488972559611002}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 41, "Epoch-Time": 241.3213894367218, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.61000061035156, "Augmented-0.05-Quantile-Accuracy": 98.29999542236328, "Augmented-0.1-Quantile-Accuracy": 98.57999420166016, "Augmented-Accuracy": 99.0873, "Augmented-Loss": 0.075429294023633, "Clean-Accuracy": 99.18, "Clean-Loss": 0.06147803738117218, "PGD-Accuracy": 6.91, "PGD-Loss": 7.185584066772461}, "Total-Time": 9685.278891324997, "Train": {"Loss": 0.9383988555978846, "avg t": 0.922127670817905, "plain loss": 0.10534867464348116, "standard loss": 0.0831797421861578}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.31666564941406, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.76666259765625, "Augmented-Accuracy": 99.18516666666666, "Augmented-Loss": 0.06886804103712241, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.05647700464725494, "PGD-Accuracy": 6.916666666666667, "PGD-Loss": 7.168147527058919}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 42, "Epoch-Time": 241.3184609413147, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.45999908447266, "Augmented-0.05-Quantile-Accuracy": 98.14999389648438, "Augmented-0.1-Quantile-Accuracy": 98.47000122070312, "Augmented-Accuracy": 99.0506, "Augmented-Loss": 0.09571391515493392, "Clean-Accuracy": 99.17, "Clean-Loss": 0.08092829029560089, "PGD-Accuracy": 6.28, "PGD-Loss": 7.2399219696044925}, "Total-Time": 9926.597352266312, "Train": {"Loss": 0.9384810277797557, "avg t": 0.9221362376742893, "plain loss": 0.10665004109983067, "standard loss": 0.08484789324469036}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.8499984741211, "Augmented-0.05-Quantile-Accuracy": 98.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.121, "Augmented-Loss": 0.08948773869295915, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.07593823383251826, "PGD-Accuracy": 6.383333333333334, "PGD-Loss": 7.206389523824056}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 43, "Epoch-Time": 241.30994296073914, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.5199966430664, "Augmented-0.05-Quantile-Accuracy": 98.30999755859375, "Augmented-0.1-Quantile-Accuracy": 98.50999450683594, "Augmented-Accuracy": 99.0816, "Augmented-Loss": 0.08986045512771607, "Clean-Accuracy": 99.15, "Clean-Loss": 0.0723200804233551, "PGD-Accuracy": 7.64, "PGD-Loss": 7.1899270294189455}, "Total-Time": 10167.90729522705, "Train": {"Loss": 0.9383776542875502, "avg t": 0.9221238121103358, "plain loss": 0.10550990409144656, "standard loss": 0.08452630413020099}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0999984741211, "Augmented-0.05-Quantile-Accuracy": 98.54999542236328, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.1525, "Augmented-Loss": 0.08507939102033774, "Clean-Accuracy": 99.25, "Clean-Loss": 0.0693899262547493, "PGD-Accuracy": 7.566666666666666, "PGD-Loss": 7.147736063639323}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 44, "Epoch-Time": 233.08552837371826, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.61000061035156, "Augmented-0.05-Quantile-Accuracy": 98.39999389648438, "Augmented-0.1-Quantile-Accuracy": 98.57999420166016, "Augmented-Accuracy": 99.161, "Augmented-Loss": 0.07095879525840282, "Clean-Accuracy": 99.24, "Clean-Loss": 0.055753618454933165, "PGD-Accuracy": 4.24, "PGD-Loss": 7.654054440307617}, "Total-Time": 10400.992823600769, "Train": {"Loss": 0.9383501645900585, "avg t": 0.922115082387571, "plain loss": 0.10197036352864028, "standard loss": 0.07987539558057431}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.13333129882812, "Augmented-0.05-Quantile-Accuracy": 98.56666564941406, "Augmented-0.1-Quantile-Accuracy": 98.71666717529297, "Augmented-Accuracy": 99.2045, "Augmented-Loss": 0.06732101701617241, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.054122420489788055, "PGD-Accuracy": 4.616666666666666, "PGD-Loss": 7.598330352783203}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 45, "Epoch-Time": 203.5887954235077, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.63999938964844, "Augmented-0.05-Quantile-Accuracy": 98.22000122070312, "Augmented-0.1-Quantile-Accuracy": 98.47000122070312, "Augmented-Accuracy": 99.0786, "Augmented-Loss": 0.07328907594513893, "Clean-Accuracy": 99.2, "Clean-Loss": 0.06253341159820557, "PGD-Accuracy": 5.17, "PGD-Loss": 7.7083100372314455}, "Total-Time": 10604.581619024277, "Train": {"Loss": 0.9383622232366491, "avg t": 0.9221230884304753, "plain loss": 0.10033475728388193, "standard loss": 0.0779363117173866}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.04999542236328, "Augmented-0.05-Quantile-Accuracy": 98.46666717529297, "Augmented-0.1-Quantile-Accuracy": 98.68333435058594, "Augmented-Accuracy": 99.1325, "Augmented-Loss": 0.06885042318801085, "Clean-Accuracy": 99.2, "Clean-Loss": 0.05918663168946902, "PGD-Accuracy": 5.733333333333333, "PGD-Loss": 7.531472539265951}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 46, "Epoch-Time": 233.5933563709259, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.57999420166016, "Augmented-0.05-Quantile-Accuracy": 98.37999725341797, "Augmented-0.1-Quantile-Accuracy": 98.55999755859375, "Augmented-Accuracy": 99.104, "Augmented-Loss": 0.08364861069369316, "Clean-Accuracy": 99.19, "Clean-Loss": 0.0669013200044632, "PGD-Accuracy": 9.15, "PGD-Loss": 6.910525231933594}, "Total-Time": 10838.174975395203, "Train": {"Loss": 0.9384444068626121, "avg t": 0.9221374592427855, "plain loss": 0.10357828453911681, "standard loss": 0.08160815493486545}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.03333282470703, "Augmented-0.05-Quantile-Accuracy": 98.43333435058594, "Augmented-0.1-Quantile-Accuracy": 98.73332977294922, "Augmented-Accuracy": 99.14983333333333, "Augmented-Loss": 0.07752228832026323, "Clean-Accuracy": 99.25, "Clean-Loss": 0.062191287606954575, "PGD-Accuracy": 8.9, "PGD-Loss": 6.776858749389649}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 47, "Epoch-Time": 241.521648645401, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.83999633789062, "Augmented-0.05-Quantile-Accuracy": 98.40999603271484, "Augmented-0.1-Quantile-Accuracy": 98.58999633789062, "Augmented-Accuracy": 99.1703, "Augmented-Loss": 0.07227129284131527, "Clean-Accuracy": 99.22, "Clean-Loss": 0.05816317839622497, "PGD-Accuracy": 6.65, "PGD-Loss": 7.415786056518555}, "Total-Time": 11079.696624040604, "Train": {"Loss": 0.9383235009864525, "avg t": 0.9221230404112074, "plain loss": 0.10309482662412857, "standard loss": 0.0817369665393123}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.23332977294922, "Augmented-0.05-Quantile-Accuracy": 98.68333435058594, "Augmented-0.1-Quantile-Accuracy": 98.86666870117188, "Augmented-Accuracy": 99.2075, "Augmented-Loss": 0.06860742990493775, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.05600967087348302, "PGD-Accuracy": 6.083333333333333, "PGD-Loss": 7.336487782796224}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 48, "Epoch-Time": 241.28920555114746, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.68999481201172, "Augmented-0.05-Quantile-Accuracy": 98.31999969482422, "Augmented-0.1-Quantile-Accuracy": 98.50999450683594, "Augmented-Accuracy": 99.1058, "Augmented-Loss": 0.07753156869912148, "Clean-Accuracy": 99.21, "Clean-Loss": 0.061598768365383146, "PGD-Accuracy": 5.27, "PGD-Loss": 7.623228015136719}, "Total-Time": 11320.985829591751, "Train": {"Loss": 0.9383706444104513, "avg t": 0.9221092320371557, "plain loss": 0.10123600789705924, "standard loss": 0.07761350847835893}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.1500015258789, "Augmented-0.05-Quantile-Accuracy": 98.53333282470703, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.2005, "Augmented-Loss": 0.07202886510034402, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.057912690341472624, "PGD-Accuracy": 5.433333333333334, "PGD-Loss": 7.578010243733724}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 49, "Epoch-Time": 241.7020959854126, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.8699951171875, "Augmented-0.05-Quantile-Accuracy": 98.45999908447266, "Augmented-0.1-Quantile-Accuracy": 98.6199951171875, "Augmented-Accuracy": 99.135, "Augmented-Loss": 0.07256681474971771, "Clean-Accuracy": 99.19, "Clean-Loss": 0.05951875727176666, "PGD-Accuracy": 6.33, "PGD-Loss": 7.480817163085938}, "Total-Time": 11562.687925577164, "Train": {"Loss": 0.9383579171851829, "avg t": 0.9221236826931989, "plain loss": 0.10531230301327178, "standard loss": 0.08601054782999887}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.19999694824219, "Augmented-0.05-Quantile-Accuracy": 98.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.94999694824219, "Augmented-Accuracy": 99.2145, "Augmented-Loss": 0.0687596480302016, "Clean-Accuracy": 99.25, "Clean-Loss": 0.05720019439856212, "PGD-Accuracy": 6.516666666666667, "PGD-Loss": 7.5100962320963545}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 50, "Epoch-Time": 206.96825170516968, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.39999389648438, "Augmented-0.05-Quantile-Accuracy": 98.20999908447266, "Augmented-0.1-Quantile-Accuracy": 98.44999694824219, "Augmented-Accuracy": 99.038, "Augmented-Loss": 0.08965808851265908, "Clean-Accuracy": 99.05, "Clean-Loss": 0.07104314903020859, "PGD-Accuracy": 6.71, "PGD-Loss": 6.464453790283203}, "Total-Time": 11769.656177282333, "Train": {"Loss": 0.9383063581431353, "avg t": 0.9221048429453814, "plain loss": 0.10464946802280559, "standard loss": 0.08128395873749697}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.98332977294922, "Augmented-0.05-Quantile-Accuracy": 98.54999542236328, "Augmented-0.1-Quantile-Accuracy": 98.76666259765625, "Augmented-Accuracy": 99.1605, "Augmented-Loss": 0.08159017061988513, "Clean-Accuracy": 99.25, "Clean-Loss": 0.06463427176078161, "PGD-Accuracy": 6.95, "PGD-Loss": 6.415250829060873}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 51, "Epoch-Time": 219.90958285331726, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.54000091552734, "Augmented-0.05-Quantile-Accuracy": 98.22999572753906, "Augmented-0.1-Quantile-Accuracy": 98.5199966430664, "Augmented-Accuracy": 99.0838, "Augmented-Loss": 0.07552929935085774, "Clean-Accuracy": 99.14, "Clean-Loss": 0.06330279220342636, "PGD-Accuracy": 4.99, "PGD-Loss": 7.515186877441407}, "Total-Time": 11989.56576013565, "Train": {"Loss": 0.9383120154804654, "avg t": 0.9220959369518139, "plain loss": 0.10057070393915522, "standard loss": 0.07970125746947748}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.96666717529297, "Augmented-0.05-Quantile-Accuracy": 98.53333282470703, "Augmented-0.1-Quantile-Accuracy": 98.71666717529297, "Augmented-Accuracy": 99.1225, "Augmented-Loss": 0.07137877118567626, "Clean-Accuracy": 99.13333333333334, "Clean-Loss": 0.06032342619697253, "PGD-Accuracy": 5.05, "PGD-Loss": 7.449253423055013}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 52, "Epoch-Time": 241.29871773719788, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.83999633789062, "Augmented-0.05-Quantile-Accuracy": 98.41999816894531, "Augmented-0.1-Quantile-Accuracy": 98.63999938964844, "Augmented-Accuracy": 99.187, "Augmented-Loss": 0.07728818088936806, "Clean-Accuracy": 99.27, "Clean-Loss": 0.06282260859012603, "PGD-Accuracy": 4.02, "PGD-Loss": 7.938301983642578}, "Total-Time": 12230.864477872849, "Train": {"Loss": 0.9383017082214355, "avg t": 0.9221078328909698, "plain loss": 0.10176568811028093, "standard loss": 0.08345339182791886}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.08333587646484, "Augmented-0.05-Quantile-Accuracy": 98.73332977294922, "Augmented-0.1-Quantile-Accuracy": 98.9000015258789, "Augmented-Accuracy": 99.2005, "Augmented-Loss": 0.07301693047066529, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.059801795115073525, "PGD-Accuracy": 4.383333333333334, "PGD-Loss": 7.885599441528321}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 53, "Epoch-Time": 241.42147827148438, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.8699951171875, "Augmented-0.05-Quantile-Accuracy": 98.3699951171875, "Augmented-0.1-Quantile-Accuracy": 98.5999984741211, "Augmented-Accuracy": 99.1564, "Augmented-Loss": 0.08534652827072144, "Clean-Accuracy": 99.2, "Clean-Loss": 0.07225840363502502, "PGD-Accuracy": 5.41, "PGD-Loss": 6.929519198608398}, "Total-Time": 12472.285956144333, "Train": {"Loss": 0.9383999018669128, "avg t": 0.9221195837126838, "plain loss": 0.104684231182381, "standard loss": 0.0849328472746743}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.08333587646484, "Augmented-0.05-Quantile-Accuracy": 98.56666564941406, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.18716666666667, "Augmented-Loss": 0.07964759688258172, "Clean-Accuracy": 99.25, "Clean-Loss": 0.06744174426794051, "PGD-Accuracy": 5.733333333333333, "PGD-Loss": 6.882235768636067}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 54, "Epoch-Time": 241.41589450836182, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.68999481201172, "Augmented-0.05-Quantile-Accuracy": 98.3699951171875, "Augmented-0.1-Quantile-Accuracy": 98.63999938964844, "Augmented-Accuracy": 99.1555, "Augmented-Loss": 0.07381560587239265, "Clean-Accuracy": 99.27, "Clean-Loss": 0.05981305544376373, "PGD-Accuracy": 5.49, "PGD-Loss": 7.5785043334960935}, "Total-Time": 12713.701850652695, "Train": {"Loss": 0.9382944448965567, "avg t": 0.9221108556323582, "plain loss": 0.10119874307491145, "standard loss": 0.08293668842426052}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.23332977294922, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.73332977294922, "Augmented-Accuracy": 99.11133333333333, "Augmented-Loss": 0.07012346340894698, "Clean-Accuracy": 99.2, "Clean-Loss": 0.05757455587387085, "PGD-Accuracy": 6.066666666666666, "PGD-Loss": 7.441327219645182}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 55, "Epoch-Time": 229.5269913673401, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.73999786376953, "Augmented-0.05-Quantile-Accuracy": 98.31999969482422, "Augmented-0.1-Quantile-Accuracy": 98.57999420166016, "Augmented-Accuracy": 99.1331, "Augmented-Loss": 0.08306861501765252, "Clean-Accuracy": 99.19, "Clean-Loss": 0.06346665343046189, "PGD-Accuracy": 6.92, "PGD-Loss": 6.841193145751953}, "Total-Time": 12943.228842020035, "Train": {"Loss": 0.9383584231270684, "avg t": 0.9221127856925682, "plain loss": 0.10407040530310746, "standard loss": 0.08337811002466414}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.19999694824219, "Augmented-0.05-Quantile-Accuracy": 98.53333282470703, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.19, "Augmented-Loss": 0.07687464896996817, "Clean-Accuracy": 99.25, "Clean-Loss": 0.05934790658950806, "PGD-Accuracy": 7.9, "PGD-Loss": 6.721912625630696}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 56, "Epoch-Time": 206.44179940223694, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.63999938964844, "Augmented-0.05-Quantile-Accuracy": 98.3699951171875, "Augmented-0.1-Quantile-Accuracy": 98.5999984741211, "Augmented-Accuracy": 99.0958, "Augmented-Loss": 0.07583111296057701, "Clean-Accuracy": 99.11, "Clean-Loss": 0.06324393576383591, "PGD-Accuracy": 3.83, "PGD-Loss": 7.5632871276855465}, "Total-Time": 13149.670641422272, "Train": {"Loss": 0.9383476488501937, "avg t": 0.9221117228402032, "plain loss": 0.09986590528488151, "standard loss": 0.07631352160595081}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.01666259765625, "Augmented-0.05-Quantile-Accuracy": 98.44999694824219, "Augmented-0.1-Quantile-Accuracy": 98.71666717529297, "Augmented-Accuracy": 99.16916666666667, "Augmented-Loss": 0.07181690643846989, "Clean-Accuracy": 99.25, "Clean-Loss": 0.060312602182229356, "PGD-Accuracy": 4.033333333333333, "PGD-Loss": 7.493193201700846}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 57, "Epoch-Time": 235.0916440486908, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.77999877929688, "Augmented-0.05-Quantile-Accuracy": 98.40999603271484, "Augmented-0.1-Quantile-Accuracy": 98.64999389648438, "Augmented-Accuracy": 99.1629, "Augmented-Loss": 0.08127392501068115, "Clean-Accuracy": 99.26, "Clean-Loss": 0.06500437389612197, "PGD-Accuracy": 4.16, "PGD-Loss": 7.710548678588867}, "Total-Time": 13384.762285470963, "Train": {"Loss": 0.9383400908576117, "avg t": 0.9220986706239206, "plain loss": 0.10254971409373823, "standard loss": 0.0802691050502989}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.18333435058594, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.19416666666666, "Augmented-Loss": 0.07630928800185521, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.06185444423556328, "PGD-Accuracy": 4.533333333333333, "PGD-Loss": 7.584811899820964}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 58, "Epoch-Time": 241.4814682006836, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.52999877929688, "Augmented-0.05-Quantile-Accuracy": 98.30999755859375, "Augmented-0.1-Quantile-Accuracy": 98.54000091552734, "Augmented-Accuracy": 99.0906, "Augmented-Loss": 0.07698516294074058, "Clean-Accuracy": 99.12, "Clean-Loss": 0.060323350822925566, "PGD-Accuracy": 5.46, "PGD-Loss": 6.920002032470703}, "Total-Time": 13626.243753671646, "Train": {"Loss": 0.9383175526018496, "avg t": 0.9221088776411833, "plain loss": 0.10153327841935332, "standard loss": 0.08167782334265886}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.96666717529297, "Augmented-0.05-Quantile-Accuracy": 98.38333129882812, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.13216666666666, "Augmented-Loss": 0.07163004043499628, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.05691304921110471, "PGD-Accuracy": 5.683333333333334, "PGD-Loss": 6.848731063842774}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 59, "Epoch-Time": 241.31629252433777, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.48999786376953, "Augmented-0.05-Quantile-Accuracy": 98.14999389648438, "Augmented-0.1-Quantile-Accuracy": 98.39999389648438, "Augmented-Accuracy": 99.0057, "Augmented-Loss": 0.07553147599828243, "Clean-Accuracy": 99.05, "Clean-Loss": 0.05764658017158508, "PGD-Accuracy": 4.89, "PGD-Loss": 7.099517373657227}, "Total-Time": 13867.560046195984, "Train": {"Loss": 0.9383472014179937, "avg t": 0.9221073180657846, "plain loss": 0.10078753532480302, "standard loss": 0.07978422950152998}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.93333435058594, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.68333435058594, "Augmented-Accuracy": 99.11083333333333, "Augmented-Loss": 0.07071054222563902, "Clean-Accuracy": 99.08333333333333, "Clean-Loss": 0.0549172743956248, "PGD-Accuracy": 4.75, "PGD-Loss": 7.077435674031576}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 60, "Epoch-Time": 241.44194507598877, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.62999725341797, "Augmented-0.05-Quantile-Accuracy": 98.3699951171875, "Augmented-0.1-Quantile-Accuracy": 98.58999633789062, "Augmented-Accuracy": 99.1171, "Augmented-Loss": 0.07122588554859162, "Clean-Accuracy": 99.2, "Clean-Loss": 0.05536856302022934, "PGD-Accuracy": 5.25, "PGD-Loss": 6.977882449340821}, "Total-Time": 14109.001991271973, "Train": {"Loss": 0.9382633593523944, "avg t": 0.922090778156563, "plain loss": 0.10075443196120083, "standard loss": 0.07530513248399452}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.23332977294922, "Augmented-0.05-Quantile-Accuracy": 98.6500015258789, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.1595, "Augmented-Loss": 0.06657908144225677, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.052557794690132144, "PGD-Accuracy": 5.783333333333333, "PGD-Loss": 6.897683904012045}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 61, "Epoch-Time": 208.24947381019592, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.90999603271484, "Augmented-0.05-Quantile-Accuracy": 98.41999816894531, "Augmented-0.1-Quantile-Accuracy": 98.63999938964844, "Augmented-Accuracy": 99.1896, "Augmented-Loss": 0.07243177162504197, "Clean-Accuracy": 99.23, "Clean-Loss": 0.05829844168424606, "PGD-Accuracy": 3.11, "PGD-Loss": 8.116542889404297}, "Total-Time": 14317.251465082169, "Train": {"Loss": 0.9382105586617081, "avg t": 0.9220711026368318, "plain loss": 0.09876009164033096, "standard loss": 0.0782096395558781}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.13333129882812, "Augmented-0.05-Quantile-Accuracy": 98.56666564941406, "Augmented-0.1-Quantile-Accuracy": 98.83333587646484, "Augmented-Accuracy": 99.21983333333333, "Augmented-Loss": 0.0694909059458971, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.05665184025963148, "PGD-Accuracy": 3.283333333333333, "PGD-Loss": 8.075047637939454}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 62, "Epoch-Time": 220.6180944442749, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.43000030517578, "Augmented-0.05-Quantile-Accuracy": 98.14999389648438, "Augmented-0.1-Quantile-Accuracy": 98.40999603271484, "Augmented-Accuracy": 98.9818, "Augmented-Loss": 0.08132605418157578, "Clean-Accuracy": 99.03, "Clean-Loss": 0.062448390555381775, "PGD-Accuracy": 5.37, "PGD-Loss": 7.1137545166015625}, "Total-Time": 14537.869559526443, "Train": {"Loss": 0.9382504130646034, "avg t": 0.9220906641395004, "plain loss": 0.09930707682326997, "standard loss": 0.07523877233818725}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.8499984741211, "Augmented-0.05-Quantile-Accuracy": 98.4000015258789, "Augmented-0.1-Quantile-Accuracy": 98.66666412353516, "Augmented-Accuracy": 99.1325, "Augmented-Loss": 0.07670337666114171, "Clean-Accuracy": 99.25, "Clean-Loss": 0.06002425687511762, "PGD-Accuracy": 6.033333333333333, "PGD-Loss": 7.0882527516682945}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 63, "Epoch-Time": 241.24951100349426, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.86000061035156, "Augmented-0.05-Quantile-Accuracy": 98.33999633789062, "Augmented-0.1-Quantile-Accuracy": 98.54000091552734, "Augmented-Accuracy": 99.1528, "Augmented-Loss": 0.07850775784659386, "Clean-Accuracy": 99.18, "Clean-Loss": 0.061826234686374666, "PGD-Accuracy": 5.06, "PGD-Loss": 7.487513619995117}, "Total-Time": 14779.119070529938, "Train": {"Loss": 0.9382706173261006, "avg t": 0.9220944262787147, "plain loss": 0.09861994473139445, "standard loss": 0.07439788213703367}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.25, "Augmented-0.05-Quantile-Accuracy": 98.54999542236328, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.17066666666666, "Augmented-Loss": 0.07422439680198828, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.05922072984774907, "PGD-Accuracy": 5.266666666666667, "PGD-Loss": 7.395167678833007}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 64, "Epoch-Time": 241.33122634887695, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.5999984741211, "Augmented-0.05-Quantile-Accuracy": 98.23999786376953, "Augmented-0.1-Quantile-Accuracy": 98.52999877929688, "Augmented-Accuracy": 99.0602, "Augmented-Loss": 0.07698929913520813, "Clean-Accuracy": 99.13, "Clean-Loss": 0.06280831686258316, "PGD-Accuracy": 4.86, "PGD-Loss": 7.308339590454102}, "Total-Time": 15020.450296878815, "Train": {"Loss": 0.9383263420882049, "avg t": 0.922106064831769, "plain loss": 0.10170240396923498, "standard loss": 0.07747790026664735}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0, "Augmented-0.05-Quantile-Accuracy": 98.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.86666870117188, "Augmented-Accuracy": 99.21066666666667, "Augmented-Loss": 0.07066558242638905, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.057930185010035835, "PGD-Accuracy": 5.583333333333333, "PGD-Loss": 7.2091145477294925}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 65, "Epoch-Time": 241.03476524353027, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.88999938964844, "Augmented-0.05-Quantile-Accuracy": 98.40999603271484, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.1907, "Augmented-Loss": 0.07306798195505142, "Clean-Accuracy": 99.24, "Clean-Loss": 0.05833025641441345, "PGD-Accuracy": 4.34, "PGD-Loss": 7.4685906982421875}, "Total-Time": 15261.485062122345, "Train": {"Loss": 0.9382518452538384, "avg t": 0.922092096010844, "plain loss": 0.10099999651025852, "standard loss": 0.07807465347978804}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.28333282470703, "Augmented-0.05-Quantile-Accuracy": 98.73332977294922, "Augmented-0.1-Quantile-Accuracy": 98.9000015258789, "Augmented-Accuracy": 99.22583333333333, "Augmented-Loss": 0.06908662984073162, "Clean-Accuracy": 99.3, "Clean-Loss": 0.05591257841388385, "PGD-Accuracy": 5.15, "PGD-Loss": 7.414330118815104}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 66, "Epoch-Time": 225.14735579490662, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.80999755859375, "Augmented-0.05-Quantile-Accuracy": 98.43000030517578, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.1583, "Augmented-Loss": 0.07068097901380062, "Clean-Accuracy": 99.22, "Clean-Loss": 0.055858576631546024, "PGD-Accuracy": 3.04, "PGD-Loss": 8.154289385986328}, "Total-Time": 15486.632417917252, "Train": {"Loss": 0.9382250952190823, "avg t": 0.9220766788765237, "plain loss": 0.0945398687397992, "standard loss": 0.07278055937201888}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0999984741211, "Augmented-0.05-Quantile-Accuracy": 98.6500015258789, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.19366666666667, "Augmented-Loss": 0.06760670832157135, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.05436833195885023, "PGD-Accuracy": 3.4166666666666665, "PGD-Loss": 8.060451126098632}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 67, "Epoch-Time": 208.65227890014648, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.75, "Augmented-0.05-Quantile-Accuracy": 98.3499984741211, "Augmented-0.1-Quantile-Accuracy": 98.55999755859375, "Augmented-Accuracy": 99.1042, "Augmented-Loss": 0.07769625539708137, "Clean-Accuracy": 99.18, "Clean-Loss": 0.06034361795186997, "PGD-Accuracy": 6.35, "PGD-Loss": 6.650710263061524}, "Total-Time": 15695.284696817398, "Train": {"Loss": 0.9382358775315461, "avg t": 0.9220749909612868, "plain loss": 0.09661841306333185, "standard loss": 0.07389156344422587}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.13333129882812, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.14433333333334, "Augmented-Loss": 0.07164469346721968, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.05616047623753548, "PGD-Accuracy": 7.316666666666666, "PGD-Loss": 6.604319244384766}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 68, "Epoch-Time": 237.66487574577332, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.72999572753906, "Augmented-0.05-Quantile-Accuracy": 98.31999969482422, "Augmented-0.1-Quantile-Accuracy": 98.55999755859375, "Augmented-Accuracy": 99.1394, "Augmented-Loss": 0.07845029052972793, "Clean-Accuracy": 99.26, "Clean-Loss": 0.05987558292150497, "PGD-Accuracy": 4.09, "PGD-Loss": 7.34607953491211}, "Total-Time": 15932.949572563171, "Train": {"Loss": 0.9382106254012497, "avg t": 0.9220823378386321, "plain loss": 0.1000284445444743, "standard loss": 0.07494335301717123}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.13333129882812, "Augmented-0.05-Quantile-Accuracy": 98.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.12583333333333, "Augmented-Loss": 0.07438368036588033, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.057730026811361315, "PGD-Accuracy": 4.616666666666666, "PGD-Loss": 7.25478369140625}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 69, "Epoch-Time": 241.2220959663391, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.63999938964844, "Augmented-0.05-Quantile-Accuracy": 98.31999969482422, "Augmented-0.1-Quantile-Accuracy": 98.57999420166016, "Augmented-Accuracy": 99.1009, "Augmented-Loss": 0.07635771345353126, "Clean-Accuracy": 99.12, "Clean-Loss": 0.05804795010089874, "PGD-Accuracy": 4.37, "PGD-Loss": 7.013972415161133}, "Total-Time": 16174.17166852951, "Train": {"Loss": 0.9382005576027764, "avg t": 0.9220745572160791, "plain loss": 0.09918623769548206, "standard loss": 0.07455555589993795}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.13333129882812, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.16833333333334, "Augmented-Loss": 0.0720405362747113, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.05580068192879359, "PGD-Accuracy": 4.533333333333333, "PGD-Loss": 7.008611770629883}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 70, "Epoch-Time": 241.3994963169098, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.81999969482422, "Augmented-0.05-Quantile-Accuracy": 98.37999725341797, "Augmented-0.1-Quantile-Accuracy": 98.58999633789062, "Augmented-Accuracy": 99.1673, "Augmented-Loss": 0.06554917850184441, "Clean-Accuracy": 99.29, "Clean-Loss": 0.05337892373800278, "PGD-Accuracy": 2.3, "PGD-Loss": 7.94562861328125}, "Total-Time": 16415.57116484642, "Train": {"Loss": 0.9381615873619362, "avg t": 0.9220750074033384, "plain loss": 0.09746043661258831, "standard loss": 0.07482514515188005}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.16666412353516, "Augmented-0.05-Quantile-Accuracy": 98.6500015258789, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.184, "Augmented-Loss": 0.062022150045633315, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.051282250066598256, "PGD-Accuracy": 2.6166666666666667, "PGD-Loss": 7.8799359181722}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 71, "Epoch-Time": 241.51887249946594, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.61000061035156, "Augmented-0.05-Quantile-Accuracy": 98.18999481201172, "Augmented-0.1-Quantile-Accuracy": 98.38999938964844, "Augmented-Accuracy": 99.0446, "Augmented-Loss": 0.07287521546936035, "Clean-Accuracy": 99.05, "Clean-Loss": 0.05891062957048416, "PGD-Accuracy": 2.45, "PGD-Loss": 7.68540608215332}, "Total-Time": 16657.090037345886, "Train": {"Loss": 0.9382648776195668, "avg t": 0.9220909059489215, "plain loss": 0.10204518587324357, "standard loss": 0.08092467514894627}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.06666564941406, "Augmented-0.05-Quantile-Accuracy": 98.56666564941406, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.11883333333333, "Augmented-Loss": 0.06830687198380629, "Clean-Accuracy": 99.2, "Clean-Loss": 0.055480930626392366, "PGD-Accuracy": 2.85, "PGD-Loss": 7.6478927663167315}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 72, "Epoch-Time": 208.22614669799805, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.90999603271484, "Augmented-0.05-Quantile-Accuracy": 98.41999816894531, "Augmented-0.1-Quantile-Accuracy": 98.66999816894531, "Augmented-Accuracy": 99.1779, "Augmented-Loss": 0.062387422585606575, "Clean-Accuracy": 99.22, "Clean-Loss": 0.04809588809013367, "PGD-Accuracy": 2.2, "PGD-Loss": 7.575225814819336}, "Total-Time": 16865.316184043884, "Train": {"Loss": 0.9381787490314908, "avg t": 0.9220797657613401, "plain loss": 0.09960881731068633, "standard loss": 0.07663933243354161}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.33333587646484, "Augmented-0.05-Quantile-Accuracy": 98.76666259765625, "Augmented-0.1-Quantile-Accuracy": 98.86666870117188, "Augmented-Accuracy": 99.25116666666666, "Augmented-Loss": 0.058387847061753276, "Clean-Accuracy": 99.3, "Clean-Loss": 0.045965618466337524, "PGD-Accuracy": 2.55, "PGD-Loss": 7.48029551188151}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 73, "Epoch-Time": 221.87816762924194, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.70999908447266, "Augmented-0.05-Quantile-Accuracy": 98.25999450683594, "Augmented-0.1-Quantile-Accuracy": 98.48999786376953, "Augmented-Accuracy": 99.1235, "Augmented-Loss": 0.07214387392377854, "Clean-Accuracy": 99.21, "Clean-Loss": 0.05458534023761749, "PGD-Accuracy": 2.61, "PGD-Loss": 7.284678109741211}, "Total-Time": 17087.194351673126, "Train": {"Loss": 0.9381835372006452, "avg t": 0.922066231003514, "plain loss": 0.09364561645013315, "standard loss": 0.06851653648747338}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.29999542236328, "Augmented-0.05-Quantile-Accuracy": 98.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.93333435058594, "Augmented-Accuracy": 99.22183333333334, "Augmented-Loss": 0.06742956937561433, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.051941577514012655, "PGD-Accuracy": 2.566666666666667, "PGD-Loss": 7.1687414296468095}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 74, "Epoch-Time": 241.4294445514679, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.8699951171875, "Augmented-0.05-Quantile-Accuracy": 98.47000122070312, "Augmented-0.1-Quantile-Accuracy": 98.73999786376953, "Augmented-Accuracy": 99.1718, "Augmented-Loss": 0.0659337226113081, "Clean-Accuracy": 99.24, "Clean-Loss": 0.05036939537525177, "PGD-Accuracy": 3.16, "PGD-Loss": 7.620784899902343}, "Total-Time": 17328.623796224594, "Train": {"Loss": 0.9382072767328333, "avg t": 0.9220670986352143, "plain loss": 0.09649040934068186, "standard loss": 0.0723300291840677}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.33333587646484, "Augmented-0.05-Quantile-Accuracy": 98.75, "Augmented-0.1-Quantile-Accuracy": 98.86666870117188, "Augmented-Accuracy": 99.26383333333334, "Augmented-Loss": 0.06176019666572412, "Clean-Accuracy": 99.36666666666666, "Clean-Loss": 0.048189313064018885, "PGD-Accuracy": 3.816666666666667, "PGD-Loss": 7.514536499023437}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 75, "Epoch-Time": 241.61596655845642, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.82999420166016, "Augmented-0.05-Quantile-Accuracy": 98.39999389648438, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.2054, "Augmented-Loss": 0.07565706720781326, "Clean-Accuracy": 99.31, "Clean-Loss": 0.05634921917915344, "PGD-Accuracy": 5.04, "PGD-Loss": 7.035026635742187}, "Total-Time": 17570.23976278305, "Train": {"Loss": 0.9381997574347037, "avg t": 0.9220695097887958, "plain loss": 0.09743748085410504, "standard loss": 0.07236232867947331}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.13333129882812, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.19816666666667, "Augmented-Loss": 0.07106261122385661, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.05388910103837649, "PGD-Accuracy": 5.483333333333333, "PGD-Loss": 7.069891423543294}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 76, "Epoch-Time": 241.25945472717285, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.82999420166016, "Augmented-0.05-Quantile-Accuracy": 98.47999572753906, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.1408, "Augmented-Loss": 0.07033384718430043, "Clean-Accuracy": 99.19, "Clean-Loss": 0.05728361209630966, "PGD-Accuracy": 3.28, "PGD-Loss": 7.599306719970703}, "Total-Time": 17811.499217510223, "Train": {"Loss": 0.9381919858720568, "avg t": 0.9220730467549076, "plain loss": 0.09646336464352091, "standard loss": 0.07088102164091888}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.21666717529297, "Augmented-0.05-Quantile-Accuracy": 98.73332977294922, "Augmented-0.1-Quantile-Accuracy": 98.86666870117188, "Augmented-Accuracy": 99.2295, "Augmented-Loss": 0.06679687149624029, "Clean-Accuracy": 99.25, "Clean-Loss": 0.05523961238066356, "PGD-Accuracy": 3.566666666666667, "PGD-Loss": 7.520521937052409}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 77, "Epoch-Time": 219.42805099487305, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.82999420166016, "Augmented-0.05-Quantile-Accuracy": 98.5199966430664, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.1935, "Augmented-Loss": 0.0596187529181242, "Clean-Accuracy": 99.25, "Clean-Loss": 0.04805403652191162, "PGD-Accuracy": 1.89, "PGD-Loss": 7.961614367675781}, "Total-Time": 18030.927268505096, "Train": {"Loss": 0.93816789287991, "avg t": 0.9220589486757914, "plain loss": 0.09510273448096392, "standard loss": 0.07186180952191353}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.3499984741211, "Augmented-0.05-Quantile-Accuracy": 98.81666564941406, "Augmented-0.1-Quantile-Accuracy": 98.9000015258789, "Augmented-Accuracy": 99.267, "Augmented-Loss": 0.05665953669061263, "Clean-Accuracy": 99.3, "Clean-Loss": 0.04649108484387398, "PGD-Accuracy": 2.2666666666666666, "PGD-Loss": 7.866781616210938}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 78, "Epoch-Time": 209.08454990386963, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.77999877929688, "Augmented-0.05-Quantile-Accuracy": 98.3699951171875, "Augmented-0.1-Quantile-Accuracy": 98.58999633789062, "Augmented-Accuracy": 99.1162, "Augmented-Loss": 0.06779148389208317, "Clean-Accuracy": 99.17, "Clean-Loss": 0.05508732706308365, "PGD-Accuracy": 2.38, "PGD-Loss": 7.876398663330078}, "Total-Time": 18240.011818408966, "Train": {"Loss": 0.9381704232957628, "avg t": 0.9220704754193624, "plain loss": 0.09671723699922913, "standard loss": 0.07621126266541305}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.1500015258789, "Augmented-0.05-Quantile-Accuracy": 98.6500015258789, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.16616666666667, "Augmented-Loss": 0.06508017979731162, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.05391396653652191, "PGD-Accuracy": 2.8666666666666667, "PGD-Loss": 7.813067260742187}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 79, "Epoch-Time": 239.03026413917542, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.40999603271484, "Augmented-0.05-Quantile-Accuracy": 98.11000061035156, "Augmented-0.1-Quantile-Accuracy": 98.3699951171875, "Augmented-Accuracy": 98.9926, "Augmented-Loss": 0.08387595793747903, "Clean-Accuracy": 99.03, "Clean-Loss": 0.0673046901345253, "PGD-Accuracy": 2.63, "PGD-Loss": 7.388931890869141}, "Total-Time": 18479.04208254814, "Train": {"Loss": 0.938181247499254, "avg t": 0.9220684002240499, "plain loss": 0.09487093140284218, "standard loss": 0.07491829623337146}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.81666564941406, "Augmented-0.05-Quantile-Accuracy": 98.43333435058594, "Augmented-0.1-Quantile-Accuracy": 98.56666564941406, "Augmented-Accuracy": 99.06566666666667, "Augmented-Loss": 0.07940788619756699, "Clean-Accuracy": 99.16666666666667, "Clean-Loss": 0.06446397542953491, "PGD-Accuracy": 3.1, "PGD-Loss": 7.363706293741862}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 80, "Epoch-Time": 241.16620111465454, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.62999725341797, "Augmented-0.05-Quantile-Accuracy": 98.25999450683594, "Augmented-0.1-Quantile-Accuracy": 98.48999786376953, "Augmented-Accuracy": 99.0948, "Augmented-Loss": 0.07187041428244113, "Clean-Accuracy": 99.18, "Clean-Loss": 0.056454913461208345, "PGD-Accuracy": 2.12, "PGD-Loss": 7.54930442199707}, "Total-Time": 18720.208283662796, "Train": {"Loss": 0.9381519416879724, "avg t": 0.922063208632999, "plain loss": 0.09685836643996064, "standard loss": 0.07218115505465755}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.03333282470703, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.73332977294922, "Augmented-Accuracy": 99.15733333333333, "Augmented-Loss": 0.06774071638921897, "Clean-Accuracy": 99.2, "Clean-Loss": 0.05408540437618892, "PGD-Accuracy": 2.8666666666666667, "PGD-Loss": 7.442092946370443}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 81, "Epoch-Time": 241.34811735153198, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.52999877929688, "Augmented-0.05-Quantile-Accuracy": 98.32999420166016, "Augmented-0.1-Quantile-Accuracy": 98.50999450683594, "Augmented-Accuracy": 99.0344, "Augmented-Loss": 0.08056408565878868, "Clean-Accuracy": 99.12, "Clean-Loss": 0.061353209817409514, "PGD-Accuracy": 3.9, "PGD-Loss": 7.396638934326172}, "Total-Time": 18961.556401014328, "Train": {"Loss": 0.9382061523861355, "avg t": 0.9220562330351936, "plain loss": 0.09431009043587582, "standard loss": 0.07176720769758578}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0999984741211, "Augmented-0.05-Quantile-Accuracy": 98.54999542236328, "Augmented-0.1-Quantile-Accuracy": 98.68333435058594, "Augmented-Accuracy": 99.0935, "Augmented-Loss": 0.07571667904933294, "Clean-Accuracy": 99.16666666666667, "Clean-Loss": 0.05859456580877304, "PGD-Accuracy": 4.183333333333334, "PGD-Loss": 7.376214599609375}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 82, "Epoch-Time": 241.5205054283142, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.80999755859375, "Augmented-0.05-Quantile-Accuracy": 98.30999755859375, "Augmented-0.1-Quantile-Accuracy": 98.54000091552734, "Augmented-Accuracy": 99.0805, "Augmented-Loss": 0.08294677537059784, "Clean-Accuracy": 99.15, "Clean-Loss": 0.06384235727787017, "PGD-Accuracy": 4.9, "PGD-Loss": 7.120029061889649}, "Total-Time": 19203.076906442642, "Train": {"Loss": 0.9381168442655493, "avg t": 0.9220569877271299, "plain loss": 0.09679690896140195, "standard loss": 0.07575381175676982}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.06666564941406, "Augmented-0.05-Quantile-Accuracy": 98.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.19283333333334, "Augmented-Loss": 0.0771457074958086, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.05975363129377365, "PGD-Accuracy": 5.216666666666667, "PGD-Loss": 7.013351170857748}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 83, "Epoch-Time": 207.6856837272644, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.68999481201172, "Augmented-0.05-Quantile-Accuracy": 98.31999969482422, "Augmented-0.1-Quantile-Accuracy": 98.54999542236328, "Augmented-Accuracy": 99.0677, "Augmented-Loss": 0.08015829356575012, "Clean-Accuracy": 99.12, "Clean-Loss": 0.061331294786930085, "PGD-Accuracy": 2.17, "PGD-Loss": 8.045132421875}, "Total-Time": 19410.762590169907, "Train": {"Loss": 0.9381089096952367, "avg t": 0.922048708403552, "plain loss": 0.09111357207474889, "standard loss": 0.06794040880379854}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.83333587646484, "Augmented-0.05-Quantile-Accuracy": 98.4000015258789, "Augmented-0.1-Quantile-Accuracy": 98.54999542236328, "Augmented-Accuracy": 99.09666666666666, "Augmented-Loss": 0.07618027155379455, "Clean-Accuracy": 99.15, "Clean-Loss": 0.059218169162670774, "PGD-Accuracy": 2.216666666666667, "PGD-Loss": 7.9360224609375}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 84, "Epoch-Time": 223.58428931236267, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.91999816894531, "Augmented-0.05-Quantile-Accuracy": 98.45999908447266, "Augmented-0.1-Quantile-Accuracy": 98.65999603271484, "Augmented-Accuracy": 99.1476, "Augmented-Loss": 0.06457418441140651, "Clean-Accuracy": 99.21, "Clean-Loss": 0.05277705452442169, "PGD-Accuracy": 1.69, "PGD-Loss": 7.782342010498047}, "Total-Time": 19634.34687948227, "Train": {"Loss": 0.9381556570618241, "avg t": 0.922061569319831, "plain loss": 0.0960242126800396, "standard loss": 0.07405008722013898}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.28333282470703, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.19366666666667, "Augmented-Loss": 0.06216301036844651, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.051785784969727196, "PGD-Accuracy": 1.9666666666666666, "PGD-Loss": 7.667126200358073}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 85, "Epoch-Time": 241.6402871608734, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.91999816894531, "Augmented-0.05-Quantile-Accuracy": 98.3499984741211, "Augmented-0.1-Quantile-Accuracy": 98.61000061035156, "Augmented-Accuracy": 99.1298, "Augmented-Loss": 0.06698838669431209, "Clean-Accuracy": 99.2, "Clean-Loss": 0.05645737336874008, "PGD-Accuracy": 2.14, "PGD-Loss": 8.143792785644532}, "Total-Time": 19875.987166643143, "Train": {"Loss": 0.9381515586464494, "avg t": 0.9220512648865029, "plain loss": 0.0957852685840041, "standard loss": 0.07434506545684956}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.33333587646484, "Augmented-0.05-Quantile-Accuracy": 98.76666259765625, "Augmented-0.1-Quantile-Accuracy": 98.86666870117188, "Augmented-Accuracy": 99.20233333333333, "Augmented-Loss": 0.06358143376628558, "Clean-Accuracy": 99.2, "Clean-Loss": 0.053815403372049334, "PGD-Accuracy": 2.65, "PGD-Loss": 8.122152084350587}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 86, "Epoch-Time": 241.37064695358276, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.83999633789062, "Augmented-0.05-Quantile-Accuracy": 98.36000061035156, "Augmented-0.1-Quantile-Accuracy": 98.5999984741211, "Augmented-Accuracy": 99.1293, "Augmented-Loss": 0.07547212533020974, "Clean-Accuracy": 99.19, "Clean-Loss": 0.06284179240465164, "PGD-Accuracy": 2.85, "PGD-Loss": 7.823177728271484}, "Total-Time": 20117.357813596725, "Train": {"Loss": 0.9381302456502562, "avg t": 0.9220575986085114, "plain loss": 0.09670266274699464, "standard loss": 0.07981770935323504}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.13333129882812, "Augmented-0.05-Quantile-Accuracy": 98.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.86666870117188, "Augmented-Accuracy": 99.17816666666667, "Augmented-Loss": 0.07072186436096828, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.05928456404805183, "PGD-Accuracy": 3.45, "PGD-Loss": 7.763642278035482}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 87, "Epoch-Time": 241.4191176891327, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.0, "Augmented-0.05-Quantile-Accuracy": 98.45999908447266, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.1335, "Augmented-Loss": 0.06467939133906364, "Clean-Accuracy": 99.18, "Clean-Loss": 0.0536306140422821, "PGD-Accuracy": 1.81, "PGD-Loss": 8.572154650878906}, "Total-Time": 20358.776931285858, "Train": {"Loss": 0.9381927810598303, "avg t": 0.9220682875491955, "plain loss": 0.09526381957972498, "standard loss": 0.07748079153122725}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.26666259765625, "Augmented-0.05-Quantile-Accuracy": 98.6500015258789, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.20883333333333, "Augmented-Loss": 0.06163371496289968, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.051599637965361274, "PGD-Accuracy": 2.1333333333333333, "PGD-Loss": 8.525136367797852}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 88, "Epoch-Time": 215.10416316986084, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.93999481201172, "Augmented-0.05-Quantile-Accuracy": 98.43000030517578, "Augmented-0.1-Quantile-Accuracy": 98.62999725341797, "Augmented-Accuracy": 99.1706, "Augmented-Loss": 0.07404945256984234, "Clean-Accuracy": 99.24, "Clean-Loss": 0.05878320920467377, "PGD-Accuracy": 3.74, "PGD-Loss": 7.693738330078125}, "Total-Time": 20573.88109445572, "Train": {"Loss": 0.9381212288362009, "avg t": 0.9220553965745149, "plain loss": 0.09360025307337441, "standard loss": 0.07294312935846824}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.25, "Augmented-0.05-Quantile-Accuracy": 98.69999694824219, "Augmented-0.1-Quantile-Accuracy": 98.83333587646484, "Augmented-Accuracy": 99.2035, "Augmented-Loss": 0.07108007272620996, "Clean-Accuracy": 99.25, "Clean-Loss": 0.05722132662932078, "PGD-Accuracy": 4.066666666666666, "PGD-Loss": 7.5645895741780596}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 89, "Epoch-Time": 210.54084253311157, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.72000122070312, "Augmented-0.05-Quantile-Accuracy": 98.43000030517578, "Augmented-0.1-Quantile-Accuracy": 98.57999420166016, "Augmented-Accuracy": 99.1254, "Augmented-Loss": 0.05809636997413635, "Clean-Accuracy": 99.19, "Clean-Loss": 0.04566024218201637, "PGD-Accuracy": 1.86, "PGD-Loss": 8.16799658203125}, "Total-Time": 20784.42193698883, "Train": {"Loss": 0.9381052137657448, "avg t": 0.9220532745431971, "plain loss": 0.09438526586426636, "standard loss": 0.07217734835324464}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.26666259765625, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.88333129882812, "Augmented-Accuracy": 99.19, "Augmented-Loss": 0.054644026594062645, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.04357873088121414, "PGD-Accuracy": 1.85, "PGD-Loss": 8.20552345275879}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 90, "Epoch-Time": 240.97065496444702, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.82999420166016, "Augmented-0.05-Quantile-Accuracy": 98.32999420166016, "Augmented-0.1-Quantile-Accuracy": 98.54999542236328, "Augmented-Accuracy": 99.134, "Augmented-Loss": 0.07466789400053024, "Clean-Accuracy": 99.23, "Clean-Loss": 0.059141303396224976, "PGD-Accuracy": 2.58, "PGD-Loss": 7.199354653930664}, "Total-Time": 21025.392591953278, "Train": {"Loss": 0.9381513140996297, "avg t": 0.9220563943121168, "plain loss": 0.094884399594201, "standard loss": 0.0728891582025422}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.1500015258789, "Augmented-0.05-Quantile-Accuracy": 98.68333435058594, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.24133333333333, "Augmented-Loss": 0.06984636994918188, "Clean-Accuracy": 99.36666666666666, "Clean-Loss": 0.055957816700140633, "PGD-Accuracy": 3.066666666666667, "PGD-Loss": 7.112775527954102}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 91, "Epoch-Time": 241.49257731437683, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.98999786376953, "Augmented-0.05-Quantile-Accuracy": 98.44999694824219, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.1937, "Augmented-Loss": 0.06692822874438763, "Clean-Accuracy": 99.27, "Clean-Loss": 0.0536559619307518, "PGD-Accuracy": 2.31, "PGD-Loss": 7.845136077880859}, "Total-Time": 21266.885169267654, "Train": {"Loss": 0.9381616992950439, "avg t": 0.9220553155828405, "plain loss": 0.09358681177563144, "standard loss": 0.0742602671428963}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.3499984741211, "Augmented-0.05-Quantile-Accuracy": 98.69999694824219, "Augmented-0.1-Quantile-Accuracy": 98.93333435058594, "Augmented-Accuracy": 99.222, "Augmented-Loss": 0.06340976869642735, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.05141608941555023, "PGD-Accuracy": 2.6166666666666667, "PGD-Loss": 7.791540486653646}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 92, "Epoch-Time": 241.49497842788696, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.88999938964844, "Augmented-0.05-Quantile-Accuracy": 98.47000122070312, "Augmented-0.1-Quantile-Accuracy": 98.72999572753906, "Augmented-Accuracy": 99.1799, "Augmented-Loss": 0.07733800986766816, "Clean-Accuracy": 99.27, "Clean-Loss": 0.05819371778964996, "PGD-Accuracy": 4.16, "PGD-Loss": 7.040554541015625}, "Total-Time": 21508.38014769554, "Train": {"Loss": 0.9380694649484422, "avg t": 0.9220404946715743, "plain loss": 0.08956075554600468, "standard loss": 0.06746846924667005}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.13333129882812, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.88333129882812, "Augmented-Accuracy": 99.2105, "Augmented-Loss": 0.07320105710665385, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.055817476590474445, "PGD-Accuracy": 4.566666666666666, "PGD-Loss": 7.003024495442708}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 93, "Epoch-Time": 241.3284032344818, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.79999542236328, "Augmented-0.05-Quantile-Accuracy": 98.47999572753906, "Augmented-0.1-Quantile-Accuracy": 98.64999389648438, "Augmented-Accuracy": 99.2036, "Augmented-Loss": 0.06676105757164955, "Clean-Accuracy": 99.27, "Clean-Loss": 0.0513284658074379, "PGD-Accuracy": 1.79, "PGD-Loss": 7.781251110839844}, "Total-Time": 21749.708550930023, "Train": {"Loss": 0.9381442046695285, "avg t": 0.9220592380276432, "plain loss": 0.0972050881297499, "standard loss": 0.07498500538755347}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.31666564941406, "Augmented-0.05-Quantile-Accuracy": 98.76666259765625, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.26466666666667, "Augmented-Loss": 0.062039719778100647, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.04830557304620743, "PGD-Accuracy": 2.2333333333333334, "PGD-Loss": 7.736439147949219}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 94, "Epoch-Time": 203.00001454353333, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.88999938964844, "Augmented-0.05-Quantile-Accuracy": 98.40999603271484, "Augmented-0.1-Quantile-Accuracy": 98.63999938964844, "Augmented-Accuracy": 99.179, "Augmented-Loss": 0.06583577826225757, "Clean-Accuracy": 99.29, "Clean-Loss": 0.05043208870887756, "PGD-Accuracy": 2.01, "PGD-Loss": 7.885464935302735}, "Total-Time": 21952.708565473557, "Train": {"Loss": 0.9380579615698921, "avg t": 0.9220342090218155, "plain loss": 0.09053566043465223, "standard loss": 0.06749728987614313}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.31666564941406, "Augmented-0.05-Quantile-Accuracy": 98.73332977294922, "Augmented-0.1-Quantile-Accuracy": 98.8499984741211, "Augmented-Accuracy": 99.25633333333333, "Augmented-Loss": 0.062085338248213134, "Clean-Accuracy": 99.36666666666666, "Clean-Loss": 0.04832807120680809, "PGD-Accuracy": 2.683333333333333, "PGD-Loss": 7.7952445780436195}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 95, "Epoch-Time": 225.20343017578125, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.8499984741211, "Augmented-0.05-Quantile-Accuracy": 98.38999938964844, "Augmented-0.1-Quantile-Accuracy": 98.63999938964844, "Augmented-Accuracy": 99.1811, "Augmented-Loss": 0.06556275666332245, "Clean-Accuracy": 99.27, "Clean-Loss": 0.04997223805785179, "PGD-Accuracy": 2.28, "PGD-Loss": 7.639858117675781}, "Total-Time": 22177.911995649338, "Train": {"Loss": 0.9380745523417438, "avg t": 0.9220338712621619, "plain loss": 0.08963651021321603, "standard loss": 0.06840957135624355}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.3499984741211, "Augmented-0.05-Quantile-Accuracy": 98.79999542236328, "Augmented-0.1-Quantile-Accuracy": 98.88333129882812, "Augmented-Accuracy": 99.25083333333333, "Augmented-Loss": 0.06225358240862688, "Clean-Accuracy": 99.33333333333333, "Clean-Loss": 0.04830930478374163, "PGD-Accuracy": 2.683333333333333, "PGD-Loss": 7.6070901285807295}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 96, "Epoch-Time": 241.5205512046814, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.82999420166016, "Augmented-0.05-Quantile-Accuracy": 98.45999908447266, "Augmented-0.1-Quantile-Accuracy": 98.70999908447266, "Augmented-Accuracy": 99.2251, "Augmented-Loss": 0.06434638080072402, "Clean-Accuracy": 99.32, "Clean-Loss": 0.05121701164245605, "PGD-Accuracy": 1.7, "PGD-Loss": 7.777052551269532}, "Total-Time": 22419.43254685402, "Train": {"Loss": 0.938090082610095, "avg t": 0.9220438873326336, "plain loss": 0.09198956903351672, "standard loss": 0.06925634710435515}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.28333282470703, "Augmented-0.05-Quantile-Accuracy": 98.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.9000015258789, "Augmented-Accuracy": 99.2355, "Augmented-Loss": 0.06044323207428058, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.048793491760889686, "PGD-Accuracy": 2.1, "PGD-Loss": 7.621254364013672}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 97, "Epoch-Time": 241.0025384426117, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.77999877929688, "Augmented-0.05-Quantile-Accuracy": 98.41999816894531, "Augmented-0.1-Quantile-Accuracy": 98.64999389648438, "Augmented-Accuracy": 99.1275, "Augmented-Loss": 0.07653425332212448, "Clean-Accuracy": 99.15, "Clean-Loss": 0.061663132190704344, "PGD-Accuracy": 2.5, "PGD-Loss": 7.371902075195313}, "Total-Time": 22660.43508529663, "Train": {"Loss": 0.9380968493179038, "avg t": 0.9220566820921722, "plain loss": 0.09515875067181054, "standard loss": 0.07444720536470413}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.18333435058594, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.1585, "Augmented-Loss": 0.0723617236183087, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.0589987749059995, "PGD-Accuracy": 3.1666666666666665, "PGD-Loss": 7.259203450520833}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 98, "Epoch-Time": 240.8365352153778, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.81999969482422, "Augmented-0.05-Quantile-Accuracy": 98.3699951171875, "Augmented-0.1-Quantile-Accuracy": 98.63999938964844, "Augmented-Accuracy": 99.138, "Augmented-Loss": 0.07664184334421158, "Clean-Accuracy": 99.25, "Clean-Loss": 0.057888911044597625, "PGD-Accuracy": 3.73, "PGD-Loss": 7.490929141235352}, "Total-Time": 22901.27162051201, "Train": {"Loss": 0.9380819064246284, "avg t": 0.9220401742193434, "plain loss": 0.09095800418147341, "standard loss": 0.06869881116460871}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.16666412353516, "Augmented-0.05-Quantile-Accuracy": 98.6500015258789, "Augmented-0.1-Quantile-Accuracy": 98.76666259765625, "Augmented-Accuracy": 99.12616666666666, "Augmented-Loss": 0.07289853072285653, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.05609544689456622, "PGD-Accuracy": 4.066666666666666, "PGD-Loss": 7.429293411254883}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 99, "Epoch-Time": 212.65320897102356, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.89999389648438, "Augmented-0.05-Quantile-Accuracy": 98.41999816894531, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.197, "Augmented-Loss": 0.062248021577000615, "Clean-Accuracy": 99.25, "Clean-Loss": 0.04758509203195572, "PGD-Accuracy": 1.3, "PGD-Loss": 8.327401556396484}, "Total-Time": 23113.924829483032, "Train": {"Loss": 0.9380697275797526, "avg t": 0.9220370063958344, "plain loss": 0.09549243039378418, "standard loss": 0.07223983888052128}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.21666717529297, "Augmented-0.05-Quantile-Accuracy": 98.76666259765625, "Augmented-0.1-Quantile-Accuracy": 98.94999694824219, "Augmented-Accuracy": 99.26683333333334, "Augmented-Loss": 0.05924587175011635, "Clean-Accuracy": 99.36666666666666, "Clean-Loss": 0.04636607017119725, "PGD-Accuracy": 1.55, "PGD-Loss": 8.210710240681966}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 100, "Epoch-Time": 212.2561104297638, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.83999633789062, "Augmented-0.05-Quantile-Accuracy": 98.3699951171875, "Augmented-0.1-Quantile-Accuracy": 98.55999755859375, "Augmented-Accuracy": 99.1549, "Augmented-Loss": 0.06180172241842747, "Clean-Accuracy": 99.26, "Clean-Loss": 0.04861112607121468, "PGD-Accuracy": 1.35, "PGD-Loss": 8.656153424072265}, "Total-Time": 23326.180939912796, "Train": {"Loss": 0.9381258942286174, "avg t": 0.9220469416865597, "plain loss": 0.09274702778568969, "standard loss": 0.06953823273270218}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.18333435058594, "Augmented-0.05-Quantile-Accuracy": 98.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.88333129882812, "Augmented-Accuracy": 99.20666666666666, "Augmented-Loss": 0.059926462450126804, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.048352966060241066, "PGD-Accuracy": 1.9833333333333334, "PGD-Loss": 8.541783432006836}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 101, "Epoch-Time": 241.7030987739563, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.91999816894531, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.2041, "Augmented-Loss": 0.07181385732352734, "Clean-Accuracy": 99.26, "Clean-Loss": 0.05238985390663147, "PGD-Accuracy": 4.08, "PGD-Loss": 7.348641052246093}, "Total-Time": 23567.884038686752, "Train": {"Loss": 0.9380332236996404, "avg t": 0.9220344498245805, "plain loss": 0.09457319066082996, "standard loss": 0.06834616365918407}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.29999542236328, "Augmented-0.05-Quantile-Accuracy": 98.78333282470703, "Augmented-0.1-Quantile-Accuracy": 98.93333435058594, "Augmented-Accuracy": 99.276, "Augmented-Loss": 0.06754761353194713, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.05026821834842364, "PGD-Accuracy": 4.133333333333334, "PGD-Loss": 7.182399993896484}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 102, "Epoch-Time": 241.26767230033875, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.81999969482422, "Augmented-0.05-Quantile-Accuracy": 98.43000030517578, "Augmented-0.1-Quantile-Accuracy": 98.6199951171875, "Augmented-Accuracy": 99.167, "Augmented-Loss": 0.06589876048350334, "Clean-Accuracy": 99.26, "Clean-Loss": 0.05005925515294075, "PGD-Accuracy": 2.27, "PGD-Loss": 7.3483747924804685}, "Total-Time": 23809.15171098709, "Train": {"Loss": 0.938113507270813, "avg t": 0.9220437572620533, "plain loss": 0.09192564880583033, "standard loss": 0.06499118354806194}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.36666870117188, "Augmented-0.05-Quantile-Accuracy": 98.75, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.21283333333334, "Augmented-Loss": 0.06163151878943046, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.04768078037103017, "PGD-Accuracy": 2.7666666666666666, "PGD-Loss": 7.303892272949219}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 103, "Epoch-Time": 241.396568775177, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.86000061035156, "Augmented-0.05-Quantile-Accuracy": 98.43999481201172, "Augmented-0.1-Quantile-Accuracy": 98.65999603271484, "Augmented-Accuracy": 99.1753, "Augmented-Loss": 0.07708236371827125, "Clean-Accuracy": 99.27, "Clean-Loss": 0.05752227965593338, "PGD-Accuracy": 3.36, "PGD-Loss": 6.306550839233399}, "Total-Time": 24050.548279762268, "Train": {"Loss": 0.9380352043752317, "avg t": 0.9220400772977758, "plain loss": 0.09253670388327709, "standard loss": 0.0677720056463171}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.29999542236328, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.88333129882812, "Augmented-Accuracy": 99.22833333333334, "Augmented-Loss": 0.07182638235310713, "Clean-Accuracy": 99.3, "Clean-Loss": 0.05412799525260925, "PGD-Accuracy": 4.116666666666666, "PGD-Loss": 6.206684997558594}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 104, "Epoch-Time": 239.68248963356018, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.95999908447266, "Augmented-0.05-Quantile-Accuracy": 98.47000122070312, "Augmented-0.1-Quantile-Accuracy": 98.66999816894531, "Augmented-Accuracy": 99.17, "Augmented-Loss": 0.06569611897230149, "Clean-Accuracy": 99.21, "Clean-Loss": 0.05118433629274368, "PGD-Accuracy": 2.88, "PGD-Loss": 6.925543814086914}, "Total-Time": 24290.23076939583, "Train": {"Loss": 0.9380185070744267, "avg t": 0.9220215731903358, "plain loss": 0.0929581009176043, "standard loss": 0.06926594218942854}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.28333282470703, "Augmented-0.05-Quantile-Accuracy": 98.73332977294922, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.23033333333333, "Augmented-Loss": 0.062089371333122256, "Clean-Accuracy": 99.35, "Clean-Loss": 0.049116520206133524, "PGD-Accuracy": 3.3666666666666667, "PGD-Loss": 6.778632731119791}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 105, "Epoch-Time": 204.9055676460266, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.79000091552734, "Augmented-0.05-Quantile-Accuracy": 98.5199966430664, "Augmented-0.1-Quantile-Accuracy": 98.72000122070312, "Augmented-Accuracy": 99.1566, "Augmented-Loss": 0.06936536049461364, "Clean-Accuracy": 99.23, "Clean-Loss": 0.05108334400653839, "PGD-Accuracy": 2.83, "PGD-Loss": 7.236475173950195}, "Total-Time": 24495.136337041855, "Train": {"Loss": 0.9380675417228981, "avg t": 0.9220339205000135, "plain loss": 0.09248367451561827, "standard loss": 0.0687461027569241}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.33333587646484, "Augmented-0.05-Quantile-Accuracy": 98.63333129882812, "Augmented-0.1-Quantile-Accuracy": 98.73332977294922, "Augmented-Accuracy": 99.23016666666666, "Augmented-Loss": 0.06388211303154627, "Clean-Accuracy": 99.38333333333334, "Clean-Loss": 0.047557420551776884, "PGD-Accuracy": 3.0833333333333335, "PGD-Loss": 7.2245575714111325}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 106, "Epoch-Time": 226.74712109565735, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.90999603271484, "Augmented-0.05-Quantile-Accuracy": 98.54999542236328, "Augmented-0.1-Quantile-Accuracy": 98.72999572753906, "Augmented-Accuracy": 99.192, "Augmented-Loss": 0.05816492431807518, "Clean-Accuracy": 99.25, "Clean-Loss": 0.04441802712678909, "PGD-Accuracy": 1.6, "PGD-Loss": 7.9791262817382815}, "Total-Time": 24721.883458137512, "Train": {"Loss": 0.9380281656053331, "avg t": 0.9220322647977758, "plain loss": 0.08983276887469825, "standard loss": 0.06568718861650538}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.31666564941406, "Augmented-0.05-Quantile-Accuracy": 98.86666870117188, "Augmented-0.1-Quantile-Accuracy": 99.0, "Augmented-Accuracy": 99.26166666666667, "Augmented-Loss": 0.0545854324199756, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.042576001852750775, "PGD-Accuracy": 1.7833333333333334, "PGD-Loss": 7.88144135538737}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 107, "Epoch-Time": 241.38385558128357, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.95999908447266, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.7699966430664, "Augmented-Accuracy": 99.2296, "Augmented-Loss": 0.06556607498121261, "Clean-Accuracy": 99.33, "Clean-Loss": 0.051828199350833895, "PGD-Accuracy": 2.79, "PGD-Loss": 6.885346200561523}, "Total-Time": 24963.267313718796, "Train": {"Loss": 0.9380685812102424, "avg t": 0.9220277804092125, "plain loss": 0.08756701092896635, "standard loss": 0.06627014380031161}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.43333435058594, "Augmented-0.05-Quantile-Accuracy": 98.83333587646484, "Augmented-0.1-Quantile-Accuracy": 98.96666717529297, "Augmented-Accuracy": 99.23166666666667, "Augmented-Loss": 0.062485324256519474, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.05019851238528887, "PGD-Accuracy": 3.816666666666667, "PGD-Loss": 6.808099909464518}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 108, "Epoch-Time": 241.50477623939514, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.82999420166016, "Augmented-0.05-Quantile-Accuracy": 98.43000030517578, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.1482, "Augmented-Loss": 0.06864649957752228, "Clean-Accuracy": 99.22, "Clean-Loss": 0.053997912609577176, "PGD-Accuracy": 3.09, "PGD-Loss": 6.915981481933594}, "Total-Time": 25204.77208995819, "Train": {"Loss": 0.9380396589703031, "avg t": 0.9220257864704838, "plain loss": 0.08861548186054949, "standard loss": 0.06707058119332349}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.16666412353516, "Augmented-0.05-Quantile-Accuracy": 98.61666870117188, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.224, "Augmented-Loss": 0.06353430303394794, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.05035229351123174, "PGD-Accuracy": 3.3, "PGD-Loss": 6.865375498453776}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 109, "Epoch-Time": 241.44429874420166, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.94999694824219, "Augmented-0.05-Quantile-Accuracy": 98.45999908447266, "Augmented-0.1-Quantile-Accuracy": 98.63999938964844, "Augmented-Accuracy": 99.1904, "Augmented-Loss": 0.0645410408834219, "Clean-Accuracy": 99.28, "Clean-Loss": 0.05193176866769791, "PGD-Accuracy": 1.9, "PGD-Loss": 7.559339996337891}, "Total-Time": 25446.216388702393, "Train": {"Loss": 0.9380624619589911, "avg t": 0.9220347397415726, "plain loss": 0.09182014372790309, "standard loss": 0.07012164878182942}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.23332977294922, "Augmented-0.05-Quantile-Accuracy": 98.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.16716666666666, "Augmented-Loss": 0.06149961607237657, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.05023541215062141, "PGD-Accuracy": 2.4833333333333334, "PGD-Loss": 7.581327158610026}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 110, "Epoch-Time": 209.52791547775269, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.02999877929688, "Augmented-0.05-Quantile-Accuracy": 98.48999786376953, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.1802, "Augmented-Loss": 0.060462228769659995, "Clean-Accuracy": 99.28, "Clean-Loss": 0.04929625498056412, "PGD-Accuracy": 1.58, "PGD-Loss": 8.083599426269531}, "Total-Time": 25655.744304180145, "Train": {"Loss": 0.9380549686219957, "avg t": 0.9220286321640014, "plain loss": 0.08918236409293286, "standard loss": 0.06912946477422008}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.3499984741211, "Augmented-0.05-Quantile-Accuracy": 98.78333282470703, "Augmented-0.1-Quantile-Accuracy": 98.93333435058594, "Augmented-Accuracy": 99.246, "Augmented-Loss": 0.05699338139653206, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.047220466901858646, "PGD-Accuracy": 1.95, "PGD-Loss": 8.016349283854167}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 111, "Epoch-Time": 214.65364503860474, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.75, "Augmented-0.05-Quantile-Accuracy": 98.36000061035156, "Augmented-0.1-Quantile-Accuracy": 98.64999389648438, "Augmented-Accuracy": 99.1459, "Augmented-Loss": 0.06320836278307437, "Clean-Accuracy": 99.28, "Clean-Loss": 0.05030929754972458, "PGD-Accuracy": 1.67, "PGD-Loss": 7.368612045288086}, "Total-Time": 25870.39794921875, "Train": {"Loss": 0.938052162611926, "avg t": 0.9220278752115038, "plain loss": 0.09010763815773845, "standard loss": 0.07017891351823453}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.31666564941406, "Augmented-0.05-Quantile-Accuracy": 98.63333129882812, "Augmented-0.1-Quantile-Accuracy": 98.76666259765625, "Augmented-Accuracy": 99.21233333333333, "Augmented-Loss": 0.05893247822721799, "Clean-Accuracy": 99.33333333333333, "Clean-Loss": 0.04743172353506088, "PGD-Accuracy": 2.2333333333333334, "PGD-Loss": 7.260701909383138}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 112, "Epoch-Time": 241.39408206939697, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.98999786376953, "Augmented-0.05-Quantile-Accuracy": 98.50999450683594, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.2242, "Augmented-Loss": 0.06198896530032158, "Clean-Accuracy": 99.29, "Clean-Loss": 0.0501294415473938, "PGD-Accuracy": 1.93, "PGD-Loss": 7.933377355957031}, "Total-Time": 26111.792031288147, "Train": {"Loss": 0.9380102115913673, "avg t": 0.92202205686216, "plain loss": 0.08739239026175606, "standard loss": 0.06785962632850365}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.23332977294922, "Augmented-0.05-Quantile-Accuracy": 98.79999542236328, "Augmented-0.1-Quantile-Accuracy": 98.93333435058594, "Augmented-Accuracy": 99.2515, "Augmented-Loss": 0.059114011918803056, "Clean-Accuracy": 99.3, "Clean-Loss": 0.04857659288744132, "PGD-Accuracy": 2.1, "PGD-Loss": 7.848013168334961}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 113, "Epoch-Time": 241.48625946044922, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.93999481201172, "Augmented-0.05-Quantile-Accuracy": 98.47999572753906, "Augmented-0.1-Quantile-Accuracy": 98.66999816894531, "Augmented-Accuracy": 99.1481, "Augmented-Loss": 0.06206445420730114, "Clean-Accuracy": 99.19, "Clean-Loss": 0.04957340550422668, "PGD-Accuracy": 0.9, "PGD-Loss": 7.936515423583985}, "Total-Time": 26353.278290748596, "Train": {"Loss": 0.9380100598865085, "avg t": 0.9220251754831384, "plain loss": 0.08916486684481308, "standard loss": 0.06862908179230161}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.16666412353516, "Augmented-0.05-Quantile-Accuracy": 98.75, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.21333333333334, "Augmented-Loss": 0.05911459384739399, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.047848713278770445, "PGD-Accuracy": 1.3, "PGD-Loss": 7.83111506652832}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 114, "Epoch-Time": 241.91118669509888, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.97999572753906, "Augmented-0.05-Quantile-Accuracy": 98.6199951171875, "Augmented-0.1-Quantile-Accuracy": 98.81999969482422, "Augmented-Accuracy": 99.2144, "Augmented-Loss": 0.062180667775154116, "Clean-Accuracy": 99.23, "Clean-Loss": 0.049083323395252225, "PGD-Accuracy": 2.05, "PGD-Loss": 7.458452551269532}, "Total-Time": 26595.189477443695, "Train": {"Loss": 0.9380222541667796, "avg t": 0.9220272008577982, "plain loss": 0.09008701625400113, "standard loss": 0.06673197991980447}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.4000015258789, "Augmented-0.05-Quantile-Accuracy": 98.83333587646484, "Augmented-0.1-Quantile-Accuracy": 98.96666717529297, "Augmented-Accuracy": 99.26733333333334, "Augmented-Loss": 0.05875072618067265, "Clean-Accuracy": 99.35, "Clean-Loss": 0.047048337678114574, "PGD-Accuracy": 2.216666666666667, "PGD-Loss": 7.34385844930013}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 115, "Epoch-Time": 239.28989386558533, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.0, "Augmented-0.05-Quantile-Accuracy": 98.5199966430664, "Augmented-0.1-Quantile-Accuracy": 98.79000091552734, "Augmented-Accuracy": 99.2106, "Augmented-Loss": 0.0678106822065115, "Clean-Accuracy": 99.3, "Clean-Loss": 0.05265277873277664, "PGD-Accuracy": 1.72, "PGD-Loss": 7.484737829589844}, "Total-Time": 26834.47937130928, "Train": {"Loss": 0.9380696001052856, "avg t": 0.9220286478996277, "plain loss": 0.08990168104878174, "standard loss": 0.06804318135976792}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.19999694824219, "Augmented-0.05-Quantile-Accuracy": 98.69999694824219, "Augmented-0.1-Quantile-Accuracy": 98.9000015258789, "Augmented-Accuracy": 99.2715, "Augmented-Loss": 0.06332310023456812, "Clean-Accuracy": 99.38333333333334, "Clean-Loss": 0.0497373026907444, "PGD-Accuracy": 2.1166666666666667, "PGD-Loss": 7.458910700480144}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 116, "Epoch-Time": 204.3063588142395, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.00999450683594, "Augmented-0.05-Quantile-Accuracy": 98.57999420166016, "Augmented-0.1-Quantile-Accuracy": 98.75999450683594, "Augmented-Accuracy": 99.1874, "Augmented-Loss": 0.06430863675963878, "Clean-Accuracy": 99.23, "Clean-Loss": 0.04959233341217041, "PGD-Accuracy": 1.95, "PGD-Loss": 7.364688952636719}, "Total-Time": 27038.78573012352, "Train": {"Loss": 0.9380477386933785, "avg t": 0.9220233420089439, "plain loss": 0.08880003578044748, "standard loss": 0.06600160510672463}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.3499984741211, "Augmented-0.05-Quantile-Accuracy": 98.79999542236328, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.23716666666667, "Augmented-Loss": 0.061565478040675324, "Clean-Accuracy": 99.3, "Clean-Loss": 0.04838220805923144, "PGD-Accuracy": 2.25, "PGD-Loss": 7.279202555338542}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 117, "Epoch-Time": 227.8259880542755, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.00999450683594, "Augmented-0.05-Quantile-Accuracy": 98.52999877929688, "Augmented-0.1-Quantile-Accuracy": 98.80999755859375, "Augmented-Accuracy": 99.2013, "Augmented-Loss": 0.07175139858579635, "Clean-Accuracy": 99.23, "Clean-Loss": 0.05447716697454452, "PGD-Accuracy": 1.93, "PGD-Loss": 7.487122741699219}, "Total-Time": 27266.611718177795, "Train": {"Loss": 0.937993219534556, "avg t": 0.9220213337297792, "plain loss": 0.09125252179039846, "standard loss": 0.06672012585180777}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.25, "Augmented-0.05-Quantile-Accuracy": 98.63333129882812, "Augmented-0.1-Quantile-Accuracy": 98.93333435058594, "Augmented-Accuracy": 99.25766666666667, "Augmented-Loss": 0.0677750804211696, "Clean-Accuracy": 99.36666666666666, "Clean-Loss": 0.05204891430338224, "PGD-Accuracy": 2.3, "PGD-Loss": 7.453298975626628}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 118, "Epoch-Time": 241.39778852462769, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.86000061035156, "Augmented-0.05-Quantile-Accuracy": 98.44999694824219, "Augmented-0.1-Quantile-Accuracy": 98.62999725341797, "Augmented-Accuracy": 99.153, "Augmented-Loss": 0.07329835167145729, "Clean-Accuracy": 99.15, "Clean-Loss": 0.05558263887166977, "PGD-Accuracy": 3.43, "PGD-Loss": 6.917271603393555}, "Total-Time": 27508.009506702423, "Train": {"Loss": 0.9380281340634381, "avg t": 0.922019902865092, "plain loss": 0.09181333881130938, "standard loss": 0.06749975859566971}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.31666564941406, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.8499984741211, "Augmented-Accuracy": 99.24183333333333, "Augmented-Loss": 0.06699083058377107, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.05124051203330358, "PGD-Accuracy": 3.5, "PGD-Loss": 6.851030298868815}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 119, "Epoch-Time": 241.52848029136658, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.97999572753906, "Augmented-0.05-Quantile-Accuracy": 98.52999877929688, "Augmented-0.1-Quantile-Accuracy": 98.73999786376953, "Augmented-Accuracy": 99.2269, "Augmented-Loss": 0.07019905719983578, "Clean-Accuracy": 99.32, "Clean-Loss": 0.05443373708724976, "PGD-Accuracy": 1.79, "PGD-Loss": 7.491907019042968}, "Total-Time": 27749.53798699379, "Train": {"Loss": 0.9380208027097914, "avg t": 0.9220246601104737, "plain loss": 0.09156938503406659, "standard loss": 0.0686654895234991}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.26666259765625, "Augmented-0.05-Quantile-Accuracy": 98.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.94999694824219, "Augmented-Accuracy": 99.22316666666667, "Augmented-Loss": 0.06755110317885876, "Clean-Accuracy": 99.3, "Clean-Loss": 0.05349895908435186, "PGD-Accuracy": 1.8333333333333333, "PGD-Loss": 7.320695805867513}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 120, "Epoch-Time": 241.4978370666504, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.80999755859375, "Augmented-0.05-Quantile-Accuracy": 98.37999725341797, "Augmented-0.1-Quantile-Accuracy": 98.5999984741211, "Augmented-Accuracy": 99.1231, "Augmented-Loss": 0.0752539842274189, "Clean-Accuracy": 99.17, "Clean-Loss": 0.057429668390750886, "PGD-Accuracy": 2.83, "PGD-Loss": 7.509664892578125}, "Total-Time": 27991.03582406044, "Train": {"Loss": 0.9380330146860193, "avg t": 0.9220208517357155, "plain loss": 0.0904018586476643, "standard loss": 0.06803349069092009}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.18333435058594, "Augmented-0.05-Quantile-Accuracy": 98.61666870117188, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.18233333333333, "Augmented-Loss": 0.07052686215619246, "Clean-Accuracy": 99.2, "Clean-Loss": 0.054451893438895546, "PGD-Accuracy": 2.8, "PGD-Loss": 7.498043416341146}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 121, "Epoch-Time": 207.64674258232117, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.8699951171875, "Augmented-0.05-Quantile-Accuracy": 98.47000122070312, "Augmented-0.1-Quantile-Accuracy": 98.72999572753906, "Augmented-Accuracy": 99.2101, "Augmented-Loss": 0.06534467539644241, "Clean-Accuracy": 99.27, "Clean-Loss": 0.05067037922143936, "PGD-Accuracy": 1.84, "PGD-Loss": 7.430610443115234}, "Total-Time": 28198.68256664276, "Train": {"Loss": 0.9380684750521624, "avg t": 0.9220281000843754, "plain loss": 0.09288246747829296, "standard loss": 0.07172869401066391}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.25, "Augmented-0.05-Quantile-Accuracy": 98.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.8499984741211, "Augmented-Accuracy": 99.22316666666667, "Augmented-Loss": 0.06291908516307672, "Clean-Accuracy": 99.3, "Clean-Loss": 0.049959494123856224, "PGD-Accuracy": 1.7666666666666666, "PGD-Loss": 7.398169514973958}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 122, "Epoch-Time": 217.29935693740845, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.93000030517578, "Augmented-0.05-Quantile-Accuracy": 98.48999786376953, "Augmented-0.1-Quantile-Accuracy": 98.70999908447266, "Augmented-Accuracy": 99.2171, "Augmented-Loss": 0.06470344770669938, "Clean-Accuracy": 99.3, "Clean-Loss": 0.049852488327026365, "PGD-Accuracy": 1.22, "PGD-Loss": 7.832359930419922}, "Total-Time": 28415.98192358017, "Train": {"Loss": 0.9379885446053964, "avg t": 0.9220181023633038, "plain loss": 0.08843376341219297, "standard loss": 0.06677942541020888}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.3499984741211, "Augmented-0.05-Quantile-Accuracy": 98.78333282470703, "Augmented-0.1-Quantile-Accuracy": 98.88333129882812, "Augmented-Accuracy": 99.25116666666666, "Augmented-Loss": 0.0608965392562747, "Clean-Accuracy": 99.3, "Clean-Loss": 0.04740589449803034, "PGD-Accuracy": 1.4333333333333333, "PGD-Loss": 7.7846126505533855}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 123, "Epoch-Time": 241.48531794548035, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.86000061035156, "Augmented-0.05-Quantile-Accuracy": 98.47000122070312, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.1322, "Augmented-Loss": 0.07788350192379952, "Clean-Accuracy": 99.19, "Clean-Loss": 0.06087847064733505, "PGD-Accuracy": 2.93, "PGD-Loss": 7.058997174072266}, "Total-Time": 28657.46724152565, "Train": {"Loss": 0.9380430017047459, "avg t": 0.9220238412221273, "plain loss": 0.08961927045892781, "standard loss": 0.06762766707605786}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.19999694824219, "Augmented-0.05-Quantile-Accuracy": 98.63333129882812, "Augmented-0.1-Quantile-Accuracy": 98.73332977294922, "Augmented-Accuracy": 99.19616666666667, "Augmented-Loss": 0.07193626257558663, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.056759945650895434, "PGD-Accuracy": 3.55, "PGD-Loss": 7.020464645385742}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 124, "Epoch-Time": 241.37422800064087, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.97999572753906, "Augmented-0.05-Quantile-Accuracy": 98.47999572753906, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.2121, "Augmented-Loss": 0.07559604602527618, "Clean-Accuracy": 99.3, "Clean-Loss": 0.05724081177711487, "PGD-Accuracy": 4.53, "PGD-Loss": 6.679744064331055}, "Total-Time": 28898.84146952629, "Train": {"Loss": 0.9379601452438919, "avg t": 0.9220105791445131, "plain loss": 0.08967344307546277, "standard loss": 0.06720154816905657}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0999984741211, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.83333587646484, "Augmented-Accuracy": 99.20633333333333, "Augmented-Loss": 0.07262475362598896, "Clean-Accuracy": 99.3, "Clean-Loss": 0.05599579075972239, "PGD-Accuracy": 4.433333333333334, "PGD-Loss": 6.637280741373698}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 125, "Epoch-Time": 241.40426635742188, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.94999694824219, "Augmented-0.05-Quantile-Accuracy": 98.54000091552734, "Augmented-0.1-Quantile-Accuracy": 98.73999786376953, "Augmented-Accuracy": 99.1846, "Augmented-Loss": 0.06676960763549805, "Clean-Accuracy": 99.3, "Clean-Loss": 0.05149154092073441, "PGD-Accuracy": 3.29, "PGD-Loss": 7.073720016479492}, "Total-Time": 29140.245735883713, "Train": {"Loss": 0.9379728648574264, "avg t": 0.9220154822490834, "plain loss": 0.08836806487154088, "standard loss": 0.06409914984526457}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.19999694824219, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.93333435058594, "Augmented-Accuracy": 99.2225, "Augmented-Loss": 0.0637160875761509, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.05010431591669719, "PGD-Accuracy": 3.3, "PGD-Loss": 6.968619150797526}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 126, "Epoch-Time": 239.59811186790466, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.0199966430664, "Augmented-0.05-Quantile-Accuracy": 98.52999877929688, "Augmented-0.1-Quantile-Accuracy": 98.72999572753906, "Augmented-Accuracy": 99.2117, "Augmented-Loss": 0.0724597645791769, "Clean-Accuracy": 99.23, "Clean-Loss": 0.05662426942586899, "PGD-Accuracy": 3.81, "PGD-Loss": 7.172919537353516}, "Total-Time": 29379.843847751617, "Train": {"Loss": 0.9380105777316623, "avg t": 0.922016431260992, "plain loss": 0.09070295228075094, "standard loss": 0.06785602522337879}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.29999542236328, "Augmented-0.05-Quantile-Accuracy": 98.56666564941406, "Augmented-0.1-Quantile-Accuracy": 98.83333587646484, "Augmented-Accuracy": 99.23283333333333, "Augmented-Loss": 0.06878045683403809, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.054483006407817204, "PGD-Accuracy": 4.016666666666667, "PGD-Loss": 7.117667663574219}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 127, "Epoch-Time": 202.75385689735413, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.98999786376953, "Augmented-0.05-Quantile-Accuracy": 98.54999542236328, "Augmented-0.1-Quantile-Accuracy": 98.72999572753906, "Augmented-Accuracy": 99.2066, "Augmented-Loss": 0.06605390195214748, "Clean-Accuracy": 99.25, "Clean-Loss": 0.053608473801612856, "PGD-Accuracy": 2.34, "PGD-Loss": 7.671365472412109}, "Total-Time": 29582.59770464897, "Train": {"Loss": 0.93796613184611, "avg t": 0.9220123152732849, "plain loss": 0.08843802746490188, "standard loss": 0.06852103475729625}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.29999542236328, "Augmented-0.05-Quantile-Accuracy": 98.68333435058594, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.24433333333333, "Augmented-Loss": 0.06314400788108508, "Clean-Accuracy": 99.33333333333333, "Clean-Loss": 0.05201167691747347, "PGD-Accuracy": 2.6166666666666667, "PGD-Loss": 7.619255071004232}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 128, "Epoch-Time": 230.4065351486206, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.72000122070312, "Augmented-0.05-Quantile-Accuracy": 98.45999908447266, "Augmented-0.1-Quantile-Accuracy": 98.64999389648438, "Augmented-Accuracy": 99.124, "Augmented-Loss": 0.06369018184077739, "Clean-Accuracy": 99.15, "Clean-Loss": 0.049556633669137956, "PGD-Accuracy": 1.14, "PGD-Loss": 7.804913482666016}, "Total-Time": 29813.004239797592, "Train": {"Loss": 0.9380064685432999, "avg t": 0.9220240661656415, "plain loss": 0.0868180747173451, "standard loss": 0.06656200594592977}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.08333587646484, "Augmented-0.05-Quantile-Accuracy": 98.51666259765625, "Augmented-0.1-Quantile-Accuracy": 98.76666259765625, "Augmented-Accuracy": 99.19633333333333, "Augmented-Loss": 0.06098871897041798, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.04837214158972104, "PGD-Accuracy": 1.1833333333333333, "PGD-Loss": 7.6599765930175785}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 129, "Epoch-Time": 241.30010747909546, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.00999450683594, "Augmented-0.05-Quantile-Accuracy": 98.47000122070312, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.1852, "Augmented-Loss": 0.06691776030683518, "Clean-Accuracy": 99.26, "Clean-Loss": 0.051457270073890685, "PGD-Accuracy": 2.31, "PGD-Loss": 7.426796066284179}, "Total-Time": 30054.304347276688, "Train": {"Loss": 0.9379904438477975, "avg t": 0.9220160124920033, "plain loss": 0.08639251103931, "standard loss": 0.06371170541533717}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.43333435058594, "Augmented-0.05-Quantile-Accuracy": 98.78333282470703, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.29883333333333, "Augmented-Loss": 0.06274206240127483, "Clean-Accuracy": 99.38333333333334, "Clean-Loss": 0.048784603267908094, "PGD-Accuracy": 2.783333333333333, "PGD-Loss": 7.348596801757813}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 130, "Epoch-Time": 241.21716284751892, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.90999603271484, "Augmented-0.05-Quantile-Accuracy": 98.48999786376953, "Augmented-0.1-Quantile-Accuracy": 98.66999816894531, "Augmented-Accuracy": 99.1347, "Augmented-Loss": 0.06883735788619519, "Clean-Accuracy": 99.17, "Clean-Loss": 0.053446860933303836, "PGD-Accuracy": 1.96, "PGD-Loss": 7.138108892822266}, "Total-Time": 30295.521510124207, "Train": {"Loss": 0.9379735602626094, "avg t": 0.9220143243471781, "plain loss": 0.0893351477587664, "standard loss": 0.06563818645477294}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.33333587646484, "Augmented-0.05-Quantile-Accuracy": 98.73332977294922, "Augmented-0.1-Quantile-Accuracy": 98.83333587646484, "Augmented-Accuracy": 99.22466666666666, "Augmented-Loss": 0.06556223217686018, "Clean-Accuracy": 99.33333333333333, "Clean-Loss": 0.05182907395561536, "PGD-Accuracy": 2.566666666666667, "PGD-Loss": 7.071120061238607}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 131, "Epoch-Time": 241.39113664627075, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.04000091552734, "Augmented-0.05-Quantile-Accuracy": 98.61000061035156, "Augmented-0.1-Quantile-Accuracy": 98.79000091552734, "Augmented-Accuracy": 99.2367, "Augmented-Loss": 0.06624301253783703, "Clean-Accuracy": 99.29, "Clean-Loss": 0.053120314991474155, "PGD-Accuracy": 2.33, "PGD-Loss": 7.647240393066406}, "Total-Time": 30536.912646770477, "Train": {"Loss": 0.9379624549018012, "avg t": 0.9220084408124288, "plain loss": 0.08926744862485816, "standard loss": 0.06839310475190481}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.31666564941406, "Augmented-0.05-Quantile-Accuracy": 98.81666564941406, "Augmented-0.1-Quantile-Accuracy": 98.98332977294922, "Augmented-Accuracy": 99.25816666666667, "Augmented-Loss": 0.06423712470511596, "Clean-Accuracy": 99.33333333333333, "Clean-Loss": 0.05223974820971489, "PGD-Accuracy": 2.2666666666666666, "PGD-Loss": 7.587094828287761}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 132, "Epoch-Time": 204.72836828231812, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.93999481201172, "Augmented-0.05-Quantile-Accuracy": 98.54000091552734, "Augmented-0.1-Quantile-Accuracy": 98.77999877929688, "Augmented-Accuracy": 99.2164, "Augmented-Loss": 0.07050633359992504, "Clean-Accuracy": 99.31, "Clean-Loss": 0.055798829340934754, "PGD-Accuracy": 2.38, "PGD-Loss": 6.915944949340821}, "Total-Time": 30741.641015052795, "Train": {"Loss": 0.9379181547871343, "avg t": 0.9220009318457709, "plain loss": 0.08695589201008821, "standard loss": 0.06767675179463846}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.26666259765625, "Augmented-0.05-Quantile-Accuracy": 98.56666564941406, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.21633333333334, "Augmented-Loss": 0.06695462516168753, "Clean-Accuracy": 99.25, "Clean-Loss": 0.05399884392817815, "PGD-Accuracy": 2.85, "PGD-Loss": 6.778244481404623}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 133, "Epoch-Time": 219.02656865119934, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.91999816894531, "Augmented-0.05-Quantile-Accuracy": 98.5199966430664, "Augmented-0.1-Quantile-Accuracy": 98.72999572753906, "Augmented-Accuracy": 99.1884, "Augmented-Loss": 0.06564357247567176, "Clean-Accuracy": 99.27, "Clean-Loss": 0.05045189734697342, "PGD-Accuracy": 2.29, "PGD-Loss": 7.331983303833008}, "Total-Time": 30960.667583703995, "Train": {"Loss": 0.9379649543055781, "avg t": 0.9220104654983238, "plain loss": 0.08775062195106798, "standard loss": 0.06576197417135592}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.23332977294922, "Augmented-0.05-Quantile-Accuracy": 98.73332977294922, "Augmented-0.1-Quantile-Accuracy": 98.86666870117188, "Augmented-Accuracy": 99.24683333333333, "Augmented-Loss": 0.06171113048573335, "Clean-Accuracy": 99.3, "Clean-Loss": 0.04832878322402636, "PGD-Accuracy": 2.3833333333333333, "PGD-Loss": 7.357064503987631}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 134, "Epoch-Time": 241.2658724784851, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.98999786376953, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.72999572753906, "Augmented-Accuracy": 99.1876, "Augmented-Loss": 0.0643632432564497, "Clean-Accuracy": 99.25, "Clean-Loss": 0.04967045242190361, "PGD-Accuracy": 1.65, "PGD-Loss": 7.86653896484375}, "Total-Time": 31201.93345618248, "Train": {"Loss": 0.938017785831734, "avg t": 0.9220106904948199, "plain loss": 0.08700248138639667, "standard loss": 0.06262566656978041}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.28333282470703, "Augmented-0.05-Quantile-Accuracy": 98.78333282470703, "Augmented-0.1-Quantile-Accuracy": 99.04999542236328, "Augmented-Accuracy": 99.24766666666666, "Augmented-Loss": 0.0620449148423473, "Clean-Accuracy": 99.25, "Clean-Loss": 0.049019599442680674, "PGD-Accuracy": 2.033333333333333, "PGD-Loss": 7.818757222493489}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 135, "Epoch-Time": 241.43773198127747, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.79000091552734, "Augmented-0.05-Quantile-Accuracy": 98.41999816894531, "Augmented-0.1-Quantile-Accuracy": 98.62999725341797, "Augmented-Accuracy": 99.1531, "Augmented-Loss": 0.07116771291518212, "Clean-Accuracy": 99.3, "Clean-Loss": 0.05299584233164787, "PGD-Accuracy": 2.06, "PGD-Loss": 7.956826873779297}, "Total-Time": 31443.371188163757, "Train": {"Loss": 0.9379957168367173, "avg t": 0.9220020921495226, "plain loss": 0.08530109039059382, "standard loss": 0.06251945282794812}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.08333587646484, "Augmented-0.05-Quantile-Accuracy": 98.61666870117188, "Augmented-0.1-Quantile-Accuracy": 98.86666870117188, "Augmented-Accuracy": 99.18616666666667, "Augmented-Loss": 0.06759504731992881, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.05129847823580106, "PGD-Accuracy": 2.4166666666666665, "PGD-Loss": 7.873755330403646}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 136, "Epoch-Time": 241.34228587150574, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.93000030517578, "Augmented-0.05-Quantile-Accuracy": 98.55999755859375, "Augmented-0.1-Quantile-Accuracy": 98.82999420166016, "Augmented-Accuracy": 99.2068, "Augmented-Loss": 0.07090075067019462, "Clean-Accuracy": 99.24, "Clean-Loss": 0.053699715268611906, "PGD-Accuracy": 3.1, "PGD-Loss": 7.231222448730469}, "Total-Time": 31684.713474035263, "Train": {"Loss": 0.9379828643445616, "avg t": 0.9220196921737106, "plain loss": 0.08813117144902555, "standard loss": 0.06516438701638469}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.33333587646484, "Augmented-0.05-Quantile-Accuracy": 98.69999694824219, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.27833333333334, "Augmented-Loss": 0.06686922111431758, "Clean-Accuracy": 99.36666666666666, "Clean-Loss": 0.05124308948715528, "PGD-Accuracy": 2.933333333333333, "PGD-Loss": 7.2184300689697265}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 137, "Epoch-Time": 236.98492550849915, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.0, "Augmented-0.05-Quantile-Accuracy": 98.50999450683594, "Augmented-0.1-Quantile-Accuracy": 98.75999450683594, "Augmented-Accuracy": 99.2182, "Augmented-Loss": 0.07331944637751579, "Clean-Accuracy": 99.28, "Clean-Loss": 0.055168449079990384, "PGD-Accuracy": 2.84, "PGD-Loss": 7.61063656616211}, "Total-Time": 31921.698399543762, "Train": {"Loss": 0.9380243737256085, "avg t": 0.922017475410744, "plain loss": 0.08790554036034479, "standard loss": 0.06506977846887377}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.3499984741211, "Augmented-0.05-Quantile-Accuracy": 98.93333435058594, "Augmented-0.1-Quantile-Accuracy": 99.01666259765625, "Augmented-Accuracy": 99.28983333333333, "Augmented-Loss": 0.0691271874344349, "Clean-Accuracy": 99.38333333333334, "Clean-Loss": 0.052785855889320374, "PGD-Accuracy": 3.05, "PGD-Loss": 7.635254409790039}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 138, "Epoch-Time": 203.82570219039917, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.93000030517578, "Augmented-0.05-Quantile-Accuracy": 98.47000122070312, "Augmented-0.1-Quantile-Accuracy": 98.66999816894531, "Augmented-Accuracy": 99.1905, "Augmented-Loss": 0.07295364996540546, "Clean-Accuracy": 99.27, "Clean-Loss": 0.05529084854125976, "PGD-Accuracy": 2.45, "PGD-Loss": 7.003274032592773}, "Total-Time": 32125.52410173416, "Train": {"Loss": 0.9379775630279824, "avg t": 0.9220161083539327, "plain loss": 0.08871244559464646, "standard loss": 0.06477902315943329}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.28333282470703, "Augmented-0.05-Quantile-Accuracy": 98.69999694824219, "Augmented-0.1-Quantile-Accuracy": 98.9000015258789, "Augmented-Accuracy": 99.227, "Augmented-Loss": 0.06923535500546296, "Clean-Accuracy": 99.3, "Clean-Loss": 0.05313867262005806, "PGD-Accuracy": 2.8, "PGD-Loss": 6.939155705769857}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 139, "Epoch-Time": 231.57171964645386, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.97000122070312, "Augmented-0.05-Quantile-Accuracy": 98.5199966430664, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.1494, "Augmented-Loss": 0.06036359604787826, "Clean-Accuracy": 99.22, "Clean-Loss": 0.04605476529598236, "PGD-Accuracy": 2.66, "PGD-Loss": 7.161434252929688}, "Total-Time": 32357.095821380615, "Train": {"Loss": 0.9379362557729085, "avg t": 0.9219998884554262, "plain loss": 0.08533068242249665, "standard loss": 0.06368229518775587}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.43333435058594, "Augmented-0.05-Quantile-Accuracy": 98.76666259765625, "Augmented-0.1-Quantile-Accuracy": 98.9000015258789, "Augmented-Accuracy": 99.22816666666667, "Augmented-Loss": 0.05667356472581625, "Clean-Accuracy": 99.3, "Clean-Loss": 0.044007142846783004, "PGD-Accuracy": 2.8333333333333335, "PGD-Loss": 7.141309392293294}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 140, "Epoch-Time": 241.63126277923584, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.87999725341797, "Augmented-0.05-Quantile-Accuracy": 98.41999816894531, "Augmented-0.1-Quantile-Accuracy": 98.64999389648438, "Augmented-Accuracy": 99.1668, "Augmented-Loss": 0.06444323817491532, "Clean-Accuracy": 99.21, "Clean-Loss": 0.04836974791288376, "PGD-Accuracy": 2.42, "PGD-Loss": 7.146543753051758}, "Total-Time": 32598.72708415985, "Train": {"Loss": 0.9379730365188034, "avg t": 0.9220083615514967, "plain loss": 0.08874034695978517, "standard loss": 0.0644772212781288}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.16666412353516, "Augmented-0.05-Quantile-Accuracy": 98.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.17916666666666, "Augmented-Loss": 0.0611845999627312, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.047068740218877796, "PGD-Accuracy": 2.533333333333333, "PGD-Loss": 7.138355387369792}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 141, "Epoch-Time": 241.59557461738586, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.83999633789062, "Augmented-0.05-Quantile-Accuracy": 98.40999603271484, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.1586, "Augmented-Loss": 0.07163915955555439, "Clean-Accuracy": 99.21, "Clean-Loss": 0.0524315576672554, "PGD-Accuracy": 2.85, "PGD-Loss": 6.9806340759277345}, "Total-Time": 32840.32265877724, "Train": {"Loss": 0.9379764024416606, "avg t": 0.9220127319229974, "plain loss": 0.08709362111621431, "standard loss": 0.0640214470271711}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.1500015258789, "Augmented-0.05-Quantile-Accuracy": 98.68333435058594, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.175, "Augmented-Loss": 0.06835200439969699, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.05171924643715223, "PGD-Accuracy": 2.8666666666666667, "PGD-Loss": 6.997240859985352}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 142, "Epoch-Time": 241.34312653541565, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.57999420166016, "Augmented-0.05-Quantile-Accuracy": 98.29000091552734, "Augmented-0.1-Quantile-Accuracy": 98.5, "Augmented-Accuracy": 99.078, "Augmented-Loss": 0.06130251371896267, "Clean-Accuracy": 99.14, "Clean-Loss": 0.046697146743536, "PGD-Accuracy": 1.04, "PGD-Loss": 7.993142687988281}, "Total-Time": 33081.66578531265, "Train": {"Loss": 0.9379561395468535, "avg t": 0.9220048714567114, "plain loss": 0.08656923043639574, "standard loss": 0.06264717966538888}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.16666412353516, "Augmented-0.05-Quantile-Accuracy": 98.46666717529297, "Augmented-0.1-Quantile-Accuracy": 98.66666412353516, "Augmented-Accuracy": 99.174, "Augmented-Loss": 0.0573757400671641, "Clean-Accuracy": 99.25, "Clean-Loss": 0.044629177033901214, "PGD-Accuracy": 1.35, "PGD-Loss": 7.897911041259766}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 143, "Epoch-Time": 205.42927169799805, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.97999572753906, "Augmented-0.05-Quantile-Accuracy": 98.54000091552734, "Augmented-0.1-Quantile-Accuracy": 98.73999786376953, "Augmented-Accuracy": 99.1903, "Augmented-Loss": 0.06422263858306408, "Clean-Accuracy": 99.24, "Clean-Loss": 0.0495741815507412, "PGD-Accuracy": 1.96, "PGD-Loss": 7.867689599609375}, "Total-Time": 33287.09505701065, "Train": {"Loss": 0.9380518334353412, "avg t": 0.9220155941998517, "plain loss": 0.08901091531470963, "standard loss": 0.06478530067426187}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.33333587646484, "Augmented-0.05-Quantile-Accuracy": 98.68333435058594, "Augmented-0.1-Quantile-Accuracy": 98.9000015258789, "Augmented-Accuracy": 99.2745, "Augmented-Loss": 0.061408793533643084, "Clean-Accuracy": 99.36666666666666, "Clean-Loss": 0.04834198827544848, "PGD-Accuracy": 2.1666666666666665, "PGD-Loss": 7.805210088094076}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 144, "Epoch-Time": 220.19801139831543, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.02999877929688, "Augmented-0.05-Quantile-Accuracy": 98.48999786376953, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.1959, "Augmented-Loss": 0.06488658061659336, "Clean-Accuracy": 99.28, "Clean-Loss": 0.048127540123462674, "PGD-Accuracy": 1.54, "PGD-Loss": 7.512310980224609}, "Total-Time": 33507.293068408966, "Train": {"Loss": 0.9379550031026205, "avg t": 0.9219949216136226, "plain loss": 0.0833024217640912, "standard loss": 0.060111515758214176}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.26666259765625, "Augmented-0.05-Quantile-Accuracy": 98.78333282470703, "Augmented-0.1-Quantile-Accuracy": 98.86666870117188, "Augmented-Accuracy": 99.29033333333334, "Augmented-Loss": 0.061752446356912453, "Clean-Accuracy": 99.36666666666666, "Clean-Loss": 0.046655330553650856, "PGD-Accuracy": 1.8666666666666667, "PGD-Loss": 7.430104537963867}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 145, "Epoch-Time": 241.43973994255066, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.0999984741211, "Augmented-0.05-Quantile-Accuracy": 98.52999877929688, "Augmented-0.1-Quantile-Accuracy": 98.7699966430664, "Augmented-Accuracy": 99.1727, "Augmented-Loss": 0.06126958061718941, "Clean-Accuracy": 99.22, "Clean-Loss": 0.0478668696463108, "PGD-Accuracy": 2.02, "PGD-Loss": 7.428269702148437}, "Total-Time": 33748.73280835152, "Train": {"Loss": 0.9379683101971944, "avg t": 0.9220112217973779, "plain loss": 0.08871237271980005, "standard loss": 0.06467756461434894}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.38333129882812, "Augmented-0.05-Quantile-Accuracy": 98.78333282470703, "Augmented-0.1-Quantile-Accuracy": 98.93333435058594, "Augmented-Accuracy": 99.26933333333334, "Augmented-Loss": 0.057599311389227706, "Clean-Accuracy": 99.35, "Clean-Loss": 0.04573473945260048, "PGD-Accuracy": 2.033333333333333, "PGD-Loss": 7.263363835652669}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 146, "Epoch-Time": 241.42658853530884, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.93000030517578, "Augmented-0.05-Quantile-Accuracy": 98.47999572753906, "Augmented-0.1-Quantile-Accuracy": 98.72000122070312, "Augmented-Accuracy": 99.1851, "Augmented-Loss": 0.07817267481136322, "Clean-Accuracy": 99.2, "Clean-Loss": 0.05692318807840347, "PGD-Accuracy": 2.52, "PGD-Loss": 7.31049352722168}, "Total-Time": 33990.159396886826, "Train": {"Loss": 0.9379556482456348, "avg t": 0.9220026380221049, "plain loss": 0.08705190834822485, "standard loss": 0.06366885734266706}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.26666259765625, "Augmented-0.05-Quantile-Accuracy": 98.6500015258789, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.2515, "Augmented-Loss": 0.07354514179805914, "Clean-Accuracy": 99.36666666666666, "Clean-Loss": 0.05430242525537809, "PGD-Accuracy": 2.816666666666667, "PGD-Loss": 7.250404591878255}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 147, "Epoch-Time": 241.37296414375305, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.02999877929688, "Augmented-0.05-Quantile-Accuracy": 98.58999633789062, "Augmented-0.1-Quantile-Accuracy": 98.7699966430664, "Augmented-Accuracy": 99.2134, "Augmented-Loss": 0.07282285472202302, "Clean-Accuracy": 99.3, "Clean-Loss": 0.054424093317985534, "PGD-Accuracy": 2.72, "PGD-Loss": 7.366193609619141}, "Total-Time": 34231.53236103058, "Train": {"Loss": 0.9379590178772256, "avg t": 0.9220036353535123, "plain loss": 0.08745628268630408, "standard loss": 0.06427416358170686}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.29999542236328, "Augmented-0.05-Quantile-Accuracy": 98.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.8499984741211, "Augmented-Accuracy": 99.294, "Augmented-Loss": 0.06911072087248167, "Clean-Accuracy": 99.43333333333334, "Clean-Loss": 0.052478277305761975, "PGD-Accuracy": 2.7333333333333334, "PGD-Loss": 7.321167322794596}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 148, "Epoch-Time": 232.65810370445251, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.89999389648438, "Augmented-0.05-Quantile-Accuracy": 98.43999481201172, "Augmented-0.1-Quantile-Accuracy": 98.64999389648438, "Augmented-Accuracy": 99.1547, "Augmented-Loss": 0.0703887415009737, "Clean-Accuracy": 99.28, "Clean-Loss": 0.05093599659204483, "PGD-Accuracy": 2.82, "PGD-Loss": 7.156248825073242}, "Total-Time": 34464.19046473503, "Train": {"Loss": 0.9379827814631992, "avg t": 0.9220068817491884, "plain loss": 0.08562626693337042, "standard loss": 0.0608527205630585}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.28333282470703, "Augmented-0.05-Quantile-Accuracy": 98.75, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.29, "Augmented-Loss": 0.06501633814275265, "Clean-Accuracy": 99.35, "Clean-Loss": 0.04781607380509376, "PGD-Accuracy": 2.65, "PGD-Loss": 7.171486953735352}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 149, "Epoch-Time": 204.90416288375854, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.90999603271484, "Augmented-0.05-Quantile-Accuracy": 98.48999786376953, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.1784, "Augmented-Loss": 0.06476621901130676, "Clean-Accuracy": 99.2, "Clean-Loss": 0.048685506069660184, "PGD-Accuracy": 1.76, "PGD-Loss": 7.838806146240234}, "Total-Time": 34669.09462761879, "Train": {"Loss": 0.9380187337663438, "avg t": 0.9220086663210834, "plain loss": 0.0862714258105666, "standard loss": 0.06087150379573857}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.25, "Augmented-0.05-Quantile-Accuracy": 98.6500015258789, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.28683333333333, "Augmented-Loss": 0.05946972439398368, "Clean-Accuracy": 99.33333333333333, "Clean-Loss": 0.045303273171186445, "PGD-Accuracy": 2.0833333333333335, "PGD-Loss": 7.7702013244628905}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.3, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_030", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.3, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
