{"Epoch": 0, "Epoch-Time": 218.52979469299316, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.89999389648438, "Augmented-0.05-Quantile-Accuracy": 97.07999420166016, "Augmented-0.1-Quantile-Accuracy": 97.54000091552734, "Augmented-Accuracy": 98.4488, "Augmented-Loss": 0.26845571141529084, "Clean-Accuracy": 98.58, "Clean-Loss": 0.169336186170578, "PGD-Accuracy": 2.68, "PGD-Loss": 3.691367337036133}, "Total-Time": 218.52979469299316, "Train": {"Loss": 3.5635492205796417, "avg t": 1.0490797872190123, "plain loss": 0.44711636331346233, "standard loss": 0.34682531806274697}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.06666564941406, "Augmented-0.05-Quantile-Accuracy": 97.81666564941406, "Augmented-0.1-Quantile-Accuracy": 98.06666564941406, "Augmented-Accuracy": 98.7375, "Augmented-Loss": 0.24426927277406058, "Clean-Accuracy": 98.88333333333334, "Clean-Loss": 0.15053836894035338, "PGD-Accuracy": 2.6, "PGD-Loss": 3.690020772298177}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 1, "Epoch-Time": 241.59543180465698, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.64999389648438, "Augmented-0.05-Quantile-Accuracy": 97.73999786376953, "Augmented-0.1-Quantile-Accuracy": 98.00999450683594, "Augmented-Accuracy": 98.806, "Augmented-Loss": 0.2626713198776245, "Clean-Accuracy": 98.94, "Clean-Loss": 0.12007319374084473, "PGD-Accuracy": 10.71, "PGD-Loss": 3.4560106674194335}, "Total-Time": 460.12522649765015, "Train": {"Loss": 1.6977652780744765, "avg t": 1.011212551470156, "plain loss": 0.3010939192242091, "standard loss": 0.18595473324369502}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.98332977294922, "Augmented-0.05-Quantile-Accuracy": 98.08333587646484, "Augmented-0.1-Quantile-Accuracy": 98.25, "Augmented-Accuracy": 98.79466666666667, "Augmented-Loss": 0.2518824669790268, "Clean-Accuracy": 98.9, "Clean-Loss": 0.116401229540507, "PGD-Accuracy": 10.033333333333333, "PGD-Loss": 3.3979432322184246}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 2, "Epoch-Time": 241.73766016960144, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.33999633789062, "Augmented-0.05-Quantile-Accuracy": 96.13999938964844, "Augmented-0.1-Quantile-Accuracy": 96.93999481201172, "Augmented-Accuracy": 98.2489, "Augmented-Loss": 0.5106782247695922, "Clean-Accuracy": 98.6, "Clean-Loss": 0.2671637702941895, "PGD-Accuracy": 10.86, "PGD-Loss": 3.318215852355957}, "Total-Time": 701.8628866672516, "Train": {"Loss": 1.5836250230294686, "avg t": 1.0082333366252758, "plain loss": 0.26323500554826557, "standard loss": 0.14981034557466152}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.21666717529297, "Augmented-0.05-Quantile-Accuracy": 96.86666870117188, "Augmented-0.1-Quantile-Accuracy": 97.53333282470703, "Augmented-Accuracy": 98.43733333333333, "Augmented-Loss": 0.4865304812844594, "Clean-Accuracy": 98.61666666666666, "Clean-Loss": 0.2518467937310537, "PGD-Accuracy": 10.05, "PGD-Loss": 3.247242073059082}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 3, "Epoch-Time": 241.7021369934082, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.22000122070312, "Augmented-0.05-Quantile-Accuracy": 97.36000061035156, "Augmented-0.1-Quantile-Accuracy": 97.79999542236328, "Augmented-Accuracy": 98.7391, "Augmented-Loss": 0.1576009935927391, "Clean-Accuracy": 98.79, "Clean-Loss": 0.07788771797418595, "PGD-Accuracy": 11.62, "PGD-Loss": 4.0136121536254885}, "Total-Time": 943.5650236606598, "Train": {"Loss": 1.5867979196972317, "avg t": 1.0071737784279717, "plain loss": 0.24508110865840219, "standard loss": 0.1396683950247588}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.88333129882812, "Augmented-0.05-Quantile-Accuracy": 97.9000015258789, "Augmented-0.1-Quantile-Accuracy": 98.26666259765625, "Augmented-Accuracy": 98.888, "Augmented-Loss": 0.14434080673853555, "Clean-Accuracy": 99.03333333333333, "Clean-Loss": 0.07265275600552559, "PGD-Accuracy": 11.05, "PGD-Loss": 3.9224499638875328}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 4, "Epoch-Time": 237.2263481616974, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.12999725341797, "Augmented-0.05-Quantile-Accuracy": 97.41999816894531, "Augmented-0.1-Quantile-Accuracy": 97.82999420166016, "Augmented-Accuracy": 98.7231, "Augmented-Loss": 0.14003421550512313, "Clean-Accuracy": 98.77, "Clean-Loss": 0.06783905166387558, "PGD-Accuracy": 14.36, "PGD-Loss": 3.7462462677001955}, "Total-Time": 1180.7913718223572, "Train": {"Loss": 1.5724321105391892, "avg t": 1.0069312532566213, "plain loss": 0.23758455247879035, "standard loss": 0.1308961537723188}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.08333587646484, "Augmented-0.05-Quantile-Accuracy": 97.98332977294922, "Augmented-0.1-Quantile-Accuracy": 98.38333129882812, "Augmented-Accuracy": 98.976, "Augmented-Loss": 0.12539182861407597, "Clean-Accuracy": 99.1, "Clean-Loss": 0.05953150999546051, "PGD-Accuracy": 13.783333333333333, "PGD-Loss": 3.686594876607259}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 5, "Epoch-Time": 199.77487325668335, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.11000061035156, "Augmented-0.05-Quantile-Accuracy": 97.40999603271484, "Augmented-0.1-Quantile-Accuracy": 97.86000061035156, "Augmented-Accuracy": 98.7235, "Augmented-Loss": 0.10229294928836823, "Clean-Accuracy": 98.73, "Clean-Loss": 0.05236051950454712, "PGD-Accuracy": 13.25, "PGD-Loss": 5.508297320556641}, "Total-Time": 1380.5662450790405, "Train": {"Loss": 1.5332357523176405, "avg t": 1.0054259485315393, "plain loss": 0.2225228628582423, "standard loss": 0.11089378015641813}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.93333435058594, "Augmented-0.05-Quantile-Accuracy": 97.98332977294922, "Augmented-0.1-Quantile-Accuracy": 98.26666259765625, "Augmented-Accuracy": 98.929, "Augmented-Loss": 0.09327824186682701, "Clean-Accuracy": 98.91666666666667, "Clean-Loss": 0.04913854312896729, "PGD-Accuracy": 12.816666666666666, "PGD-Loss": 5.392828687032064}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 6, "Epoch-Time": 229.32210755348206, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.87999725341797, "Augmented-0.05-Quantile-Accuracy": 97.3499984741211, "Augmented-0.1-Quantile-Accuracy": 97.75, "Augmented-Accuracy": 98.8635, "Augmented-Loss": 0.15078181380462646, "Clean-Accuracy": 98.8, "Clean-Loss": 0.06013021773099899, "PGD-Accuracy": 14.46, "PGD-Loss": 4.054336380004883}, "Total-Time": 1609.8883526325226, "Train": {"Loss": 1.5061064091435186, "avg t": 1.0047624164863869, "plain loss": 0.215977913934213, "standard loss": 0.10330720493970094}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.53333282470703, "Augmented-0.05-Quantile-Accuracy": 97.83333587646484, "Augmented-0.1-Quantile-Accuracy": 98.0999984741211, "Augmented-Accuracy": 98.93983333333334, "Augmented-Loss": 0.14050686935941378, "Clean-Accuracy": 98.98333333333333, "Clean-Loss": 0.05729417532682419, "PGD-Accuracy": 14.166666666666666, "PGD-Loss": 3.8892953186035157}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 7, "Epoch-Time": 241.5632176399231, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.82999420166016, "Augmented-0.05-Quantile-Accuracy": 97.30999755859375, "Augmented-0.1-Quantile-Accuracy": 97.86000061035156, "Augmented-Accuracy": 98.8273, "Augmented-Loss": 0.15231917682886123, "Clean-Accuracy": 99.0, "Clean-Loss": 0.06613808200359345, "PGD-Accuracy": 13.85, "PGD-Loss": 3.957826022338867}, "Total-Time": 1851.4515702724457, "Train": {"Loss": 1.4808844015333387, "avg t": 1.0042507460205643, "plain loss": 0.2110336993711964, "standard loss": 0.0988836818823108}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.78333282470703, "Augmented-0.05-Quantile-Accuracy": 98.04999542236328, "Augmented-0.1-Quantile-Accuracy": 98.36666870117188, "Augmented-Accuracy": 99.0225, "Augmented-Loss": 0.13913759384036065, "Clean-Accuracy": 99.11666666666666, "Clean-Loss": 0.0611988146007061, "PGD-Accuracy": 13.216666666666667, "PGD-Loss": 3.888002487182617}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 8, "Epoch-Time": 241.62177920341492, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.13999938964844, "Augmented-0.05-Quantile-Accuracy": 97.43000030517578, "Augmented-0.1-Quantile-Accuracy": 97.86000061035156, "Augmented-Accuracy": 98.8185, "Augmented-Loss": 0.11091123068284989, "Clean-Accuracy": 98.88, "Clean-Loss": 0.05335801336765289, "PGD-Accuracy": 13.67, "PGD-Loss": 4.354917092895508}, "Total-Time": 2093.0733494758606, "Train": {"Loss": 1.4310215356614855, "avg t": 1.0034832884117408, "plain loss": 0.20547908106909857, "standard loss": 0.09703988657615803}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.88333129882812, "Augmented-0.05-Quantile-Accuracy": 97.8499984741211, "Augmented-0.1-Quantile-Accuracy": 98.13333129882812, "Augmented-Accuracy": 98.95966666666666, "Augmented-Loss": 0.09923431545933088, "Clean-Accuracy": 99.01666666666667, "Clean-Loss": 0.04959977659086386, "PGD-Accuracy": 13.116666666666667, "PGD-Loss": 4.221735984802246}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 9, "Epoch-Time": 241.62713074684143, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.08999633789062, "Augmented-0.05-Quantile-Accuracy": 97.65999603271484, "Augmented-0.1-Quantile-Accuracy": 98.14999389648438, "Augmented-Accuracy": 98.9619, "Augmented-Loss": 0.12068484632277489, "Clean-Accuracy": 99.03, "Clean-Loss": 0.05037217360138893, "PGD-Accuracy": 12.56, "PGD-Loss": 3.518931491088867}, "Total-Time": 2334.700480222702, "Train": {"Loss": 1.4252333335876466, "avg t": 1.0030395673116048, "plain loss": 0.20015315198898329, "standard loss": 0.09288299042317602}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.94999694824219, "Augmented-0.05-Quantile-Accuracy": 98.0999984741211, "Augmented-0.1-Quantile-Accuracy": 98.46666717529297, "Augmented-Accuracy": 99.07616666666667, "Augmented-Loss": 0.11016567499955496, "Clean-Accuracy": 99.15, "Clean-Loss": 0.046866778547565144, "PGD-Accuracy": 12.333333333333334, "PGD-Loss": 3.375084243774414}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 10, "Epoch-Time": 207.16948056221008, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.13999938964844, "Augmented-0.05-Quantile-Accuracy": 97.54999542236328, "Augmented-0.1-Quantile-Accuracy": 98.08999633789062, "Augmented-Accuracy": 98.8926, "Augmented-Loss": 0.10471007509732247, "Clean-Accuracy": 98.99, "Clean-Loss": 0.04589563218951225, "PGD-Accuracy": 14.16, "PGD-Loss": 4.351941404724121}, "Total-Time": 2541.869960784912, "Train": {"Loss": 1.4054847329104387, "avg t": 1.0026571407318114, "plain loss": 0.19326152912422467, "standard loss": 0.08964121092690362}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.19999694824219, "Augmented-0.05-Quantile-Accuracy": 98.26666259765625, "Augmented-0.1-Quantile-Accuracy": 98.58333587646484, "Augmented-Accuracy": 99.16683333333333, "Augmented-Loss": 0.09284228423058986, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.0416850338379542, "PGD-Accuracy": 14.183333333333334, "PGD-Loss": 4.200359972635905}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 11, "Epoch-Time": 220.80827856063843, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.22000122070312, "Augmented-0.05-Quantile-Accuracy": 97.66999816894531, "Augmented-0.1-Quantile-Accuracy": 98.12999725341797, "Augmented-Accuracy": 98.9664, "Augmented-Loss": 0.12341452118206024, "Clean-Accuracy": 99.08, "Clean-Loss": 0.04897654021978378, "PGD-Accuracy": 12.96, "PGD-Loss": 3.4145937591552733}, "Total-Time": 2762.6782393455505, "Train": {"Loss": 1.398948795106676, "avg t": 1.0021854971779718, "plain loss": 0.18589128246660602, "standard loss": 0.08618573151252888}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.13333129882812, "Augmented-0.05-Quantile-Accuracy": 98.08333587646484, "Augmented-0.1-Quantile-Accuracy": 98.33333587646484, "Augmented-Accuracy": 99.058, "Augmented-Loss": 0.11452628421386082, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.04756483524044355, "PGD-Accuracy": 12.566666666666666, "PGD-Loss": 3.3116400044759113}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 12, "Epoch-Time": 241.63658261299133, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.7699966430664, "Augmented-0.05-Quantile-Accuracy": 97.16999816894531, "Augmented-0.1-Quantile-Accuracy": 97.6199951171875, "Augmented-Accuracy": 98.6403, "Augmented-Loss": 0.13940375094509125, "Clean-Accuracy": 98.91, "Clean-Loss": 0.05766257210969925, "PGD-Accuracy": 14.36, "PGD-Loss": 3.67677451171875}, "Total-Time": 3004.314821958542, "Train": {"Loss": 1.400717759097064, "avg t": 1.0020822948879666, "plain loss": 0.1789302764327437, "standard loss": 0.08034465043633073}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.75, "Augmented-0.05-Quantile-Accuracy": 97.94999694824219, "Augmented-0.1-Quantile-Accuracy": 98.19999694824219, "Augmented-Accuracy": 98.97633333333333, "Augmented-Loss": 0.12572250824491182, "Clean-Accuracy": 99.11666666666666, "Clean-Loss": 0.05161434672276179, "PGD-Accuracy": 14.283333333333333, "PGD-Loss": 3.569999651590983}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 13, "Epoch-Time": 241.6837067604065, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.80999755859375, "Augmented-0.05-Quantile-Accuracy": 97.22999572753906, "Augmented-0.1-Quantile-Accuracy": 97.79000091552734, "Augmented-Accuracy": 98.8076, "Augmented-Loss": 0.1648371264986992, "Clean-Accuracy": 99.04, "Clean-Loss": 0.05986345920562744, "PGD-Accuracy": 12.0, "PGD-Loss": 3.175173492431641}, "Total-Time": 3245.9985287189484, "Train": {"Loss": 1.4323149137850162, "avg t": 1.0021528967751396, "plain loss": 0.17562265889556322, "standard loss": 0.07845600294846075}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.86666870117188, "Augmented-0.05-Quantile-Accuracy": 98.08333587646484, "Augmented-0.1-Quantile-Accuracy": 98.41666412353516, "Augmented-Accuracy": 99.01516666666667, "Augmented-Loss": 0.14818469606637955, "Clean-Accuracy": 99.16666666666667, "Clean-Loss": 0.05433333430687586, "PGD-Accuracy": 11.433333333333334, "PGD-Loss": 3.0787069040934245}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 14, "Epoch-Time": 241.47821497917175, "Test": {"Augmented-0.01-Quantile-Accuracy": 93.77999877929688, "Augmented-0.05-Quantile-Accuracy": 96.18999481201172, "Augmented-0.1-Quantile-Accuracy": 96.97000122070312, "Augmented-Accuracy": 98.5167, "Augmented-Loss": 0.27602439311218263, "Clean-Accuracy": 98.9, "Clean-Loss": 0.12596585018634796, "PGD-Accuracy": 13.61, "PGD-Loss": 3.0574666534423827}, "Total-Time": 3487.47674369812, "Train": {"Loss": 1.4046409026958324, "avg t": 1.0015529256750035, "plain loss": 0.1677848303335685, "standard loss": 0.07627314429040308}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.19999694824219, "Augmented-0.05-Quantile-Accuracy": 97.18333435058594, "Augmented-0.1-Quantile-Accuracy": 97.73332977294922, "Augmented-Accuracy": 98.8055, "Augmented-Loss": 0.24777937654018403, "Clean-Accuracy": 99.11666666666666, "Clean-Loss": 0.11112840672334036, "PGD-Accuracy": 12.916666666666666, "PGD-Loss": 2.9534920908610025}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 15, "Epoch-Time": 237.71947169303894, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.52999877929688, "Augmented-0.05-Quantile-Accuracy": 97.68000030517578, "Augmented-0.1-Quantile-Accuracy": 98.02999877929688, "Augmented-Accuracy": 98.9264, "Augmented-Loss": 0.08920112514162064, "Clean-Accuracy": 99.03, "Clean-Loss": 0.03912561593949795, "PGD-Accuracy": 12.42, "PGD-Loss": 3.522234378051758}, "Total-Time": 3725.196215391159, "Train": {"Loss": 1.4614192864100137, "avg t": 1.0017435121536256, "plain loss": 0.16544804121653256, "standard loss": 0.07446356068717108}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.16666412353516, "Augmented-0.05-Quantile-Accuracy": 98.16666412353516, "Augmented-0.1-Quantile-Accuracy": 98.44999694824219, "Augmented-Accuracy": 99.11416666666666, "Augmented-Loss": 0.08146023215095202, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.0387780382335186, "PGD-Accuracy": 11.983333333333333, "PGD-Loss": 3.425309356689453}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 16, "Epoch-Time": 201.99953651428223, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.23999786376953, "Augmented-0.05-Quantile-Accuracy": 97.56999969482422, "Augmented-0.1-Quantile-Accuracy": 98.11000061035156, "Augmented-Accuracy": 98.9717, "Augmented-Loss": 0.0949304657831192, "Clean-Accuracy": 99.11, "Clean-Loss": 0.039803219646215436, "PGD-Accuracy": 12.83, "PGD-Loss": 5.012728237915039}, "Total-Time": 3927.1957519054413, "Train": {"Loss": 1.4104613127531829, "avg t": 1.0014028967398185, "plain loss": 0.15923492953689028, "standard loss": 0.06881254043623253}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.83333587646484, "Augmented-0.05-Quantile-Accuracy": 97.9000015258789, "Augmented-0.1-Quantile-Accuracy": 98.23332977294922, "Augmented-Accuracy": 98.958, "Augmented-Loss": 0.09307767607072989, "Clean-Accuracy": 99.05, "Clean-Loss": 0.04331935283044974, "PGD-Accuracy": 12.35, "PGD-Loss": 4.727952878316244}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 17, "Epoch-Time": 230.47972559928894, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.41999816894531, "Augmented-0.05-Quantile-Accuracy": 97.75999450683594, "Augmented-0.1-Quantile-Accuracy": 98.05999755859375, "Augmented-Accuracy": 98.9358, "Augmented-Loss": 0.11991538025546074, "Clean-Accuracy": 99.04, "Clean-Loss": 0.046645696538686755, "PGD-Accuracy": 14.06, "PGD-Loss": 3.815874028015137}, "Total-Time": 4157.67547750473, "Train": {"Loss": 1.3974269206435592, "avg t": 1.001249106230559, "plain loss": 0.158969578711192, "standard loss": 0.06686741465330123}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.33333587646484, "Augmented-0.05-Quantile-Accuracy": 98.26666259765625, "Augmented-0.1-Quantile-Accuracy": 98.54999542236328, "Augmented-Accuracy": 99.14783333333334, "Augmented-Loss": 0.10530969633817673, "Clean-Accuracy": 99.15, "Clean-Loss": 0.04263721989095211, "PGD-Accuracy": 13.083333333333334, "PGD-Loss": 3.7139795532226563}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 18, "Epoch-Time": 241.4755563735962, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.45999908447266, "Augmented-0.05-Quantile-Accuracy": 97.68999481201172, "Augmented-0.1-Quantile-Accuracy": 98.13999938964844, "Augmented-Accuracy": 98.9607, "Augmented-Loss": 0.06983993261241912, "Clean-Accuracy": 99.04, "Clean-Loss": 0.037213920852541924, "PGD-Accuracy": 12.57, "PGD-Loss": 5.037821952819824}, "Total-Time": 4399.151033878326, "Train": {"Loss": 1.412529669655694, "avg t": 1.0013943127172964, "plain loss": 0.15823966245474638, "standard loss": 0.06525279096541581}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.06666564941406, "Augmented-0.05-Quantile-Accuracy": 98.0, "Augmented-0.1-Quantile-Accuracy": 98.4000015258789, "Augmented-Accuracy": 99.0355, "Augmented-Loss": 0.0641812701305747, "Clean-Accuracy": 99.08333333333333, "Clean-Loss": 0.03832309038440387, "PGD-Accuracy": 11.866666666666667, "PGD-Loss": 4.902281664530436}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 19, "Epoch-Time": 241.6067419052124, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.61000061035156, "Augmented-0.05-Quantile-Accuracy": 97.7699966430664, "Augmented-0.1-Quantile-Accuracy": 98.11000061035156, "Augmented-Accuracy": 98.9696, "Augmented-Loss": 0.09295130310034752, "Clean-Accuracy": 99.0, "Clean-Loss": 0.04205351659655571, "PGD-Accuracy": 13.27, "PGD-Loss": 4.143867301940918}, "Total-Time": 4640.757775783539, "Train": {"Loss": 1.4633410540686713, "avg t": 1.0019139886255617, "plain loss": 0.15672678114219962, "standard loss": 0.06581975848807228}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.16666412353516, "Augmented-0.05-Quantile-Accuracy": 98.11666870117188, "Augmented-0.1-Quantile-Accuracy": 98.44999694824219, "Augmented-Accuracy": 99.0435, "Augmented-Loss": 0.08509822744210561, "Clean-Accuracy": 99.01666666666667, "Clean-Loss": 0.041159862654904525, "PGD-Accuracy": 12.416666666666666, "PGD-Loss": 3.921408401489258}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 20, "Epoch-Time": 241.90077328681946, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.40999603271484, "Augmented-0.05-Quantile-Accuracy": 97.72000122070312, "Augmented-0.1-Quantile-Accuracy": 98.0999984741211, "Augmented-Accuracy": 99.009, "Augmented-Loss": 0.07673517788302898, "Clean-Accuracy": 99.12, "Clean-Loss": 0.03570026960372925, "PGD-Accuracy": 12.48, "PGD-Loss": 4.84165344543457}, "Total-Time": 4882.658549070358, "Train": {"Loss": 1.5364671856562298, "avg t": 1.0024790445257117, "plain loss": 0.15115236847842187, "standard loss": 0.0656954720467329}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.76666259765625, "Augmented-0.05-Quantile-Accuracy": 98.01666259765625, "Augmented-0.1-Quantile-Accuracy": 98.43333435058594, "Augmented-Accuracy": 99.03933333333333, "Augmented-Loss": 0.07100551339824994, "Clean-Accuracy": 99.08333333333333, "Clean-Loss": 0.03898833546290795, "PGD-Accuracy": 12.1, "PGD-Loss": 4.6460953699747725}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 21, "Epoch-Time": 207.3285310268402, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.33999633789062, "Augmented-0.05-Quantile-Accuracy": 97.41999816894531, "Augmented-0.1-Quantile-Accuracy": 97.81999969482422, "Augmented-Accuracy": 98.8086, "Augmented-Loss": 0.0658165572808981, "Clean-Accuracy": 98.99, "Clean-Loss": 0.03614020645469427, "PGD-Accuracy": 13.05, "PGD-Loss": 4.588124015808106}, "Total-Time": 5089.9870800971985, "Train": {"Loss": 1.4401354242960611, "avg t": 1.001461924535257, "plain loss": 0.15018257589516815, "standard loss": 0.06294404430135532}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.91666412353516, "Augmented-0.05-Quantile-Accuracy": 98.0999984741211, "Augmented-0.1-Quantile-Accuracy": 98.51666259765625, "Augmented-Accuracy": 99.11383333333333, "Augmented-Loss": 0.058187424910366534, "Clean-Accuracy": 99.13333333333334, "Clean-Loss": 0.03546779491007328, "PGD-Accuracy": 13.4, "PGD-Loss": 4.338494318644206}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 22, "Epoch-Time": 219.65609574317932, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.55999755859375, "Augmented-0.05-Quantile-Accuracy": 97.72999572753906, "Augmented-0.1-Quantile-Accuracy": 98.13999938964844, "Augmented-Accuracy": 98.9742, "Augmented-Loss": 0.038392849035426974, "Clean-Accuracy": 99.04, "Clean-Loss": 0.030435096732154488, "PGD-Accuracy": 12.05, "PGD-Loss": 5.787392553710937}, "Total-Time": 5309.643175840378, "Train": {"Loss": 1.7589125772758767, "avg t": 1.00356792389905, "plain loss": 0.15052427513864314, "standard loss": 0.06248455386526055}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.3499984741211, "Augmented-0.05-Quantile-Accuracy": 98.08333587646484, "Augmented-0.1-Quantile-Accuracy": 98.31666564941406, "Augmented-Accuracy": 99.00933333333333, "Augmented-Loss": 0.038943891370315106, "Clean-Accuracy": 98.98333333333333, "Clean-Loss": 0.0353015587029513, "PGD-Accuracy": 11.633333333333333, "PGD-Loss": 5.5031996332804365}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 23, "Epoch-Time": 241.64514303207397, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.11000061035156, "Augmented-0.05-Quantile-Accuracy": 97.13999938964844, "Augmented-0.1-Quantile-Accuracy": 97.77999877929688, "Augmented-Accuracy": 98.809, "Augmented-Loss": 0.13688440649461747, "Clean-Accuracy": 99.09, "Clean-Loss": 0.0521693941950798, "PGD-Accuracy": 10.79, "PGD-Loss": 4.011820634460449}, "Total-Time": 5551.288318872452, "Train": {"Loss": 1.5480787222120498, "avg t": 1.0017667085506299, "plain loss": 0.1416966072947891, "standard loss": 0.06030044703985806}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.11666870117188, "Augmented-0.05-Quantile-Accuracy": 97.69999694824219, "Augmented-0.1-Quantile-Accuracy": 98.0999984741211, "Augmented-Accuracy": 98.91933333333333, "Augmented-Loss": 0.1258896619606018, "Clean-Accuracy": 99.01666666666667, "Clean-Loss": 0.0497902908573548, "PGD-Accuracy": 10.033333333333333, "PGD-Loss": 3.7783942616780597}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 24, "Epoch-Time": 241.7839252948761, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.07999420166016, "Augmented-0.05-Quantile-Accuracy": 96.93999481201172, "Augmented-0.1-Quantile-Accuracy": 97.56999969482422, "Augmented-Accuracy": 98.6642, "Augmented-Loss": 0.12455120166349411, "Clean-Accuracy": 98.84, "Clean-Loss": 0.05757155941724777, "PGD-Accuracy": 13.22, "PGD-Loss": 3.7960740844726564}, "Total-Time": 5793.072244167328, "Train": {"Loss": 1.487651990396005, "avg t": 1.0013401075292516, "plain loss": 0.1424150995607728, "standard loss": 0.06204537890272008}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.5999984741211, "Augmented-0.05-Quantile-Accuracy": 97.29999542236328, "Augmented-0.1-Quantile-Accuracy": 97.91666412353516, "Augmented-Accuracy": 98.80183333333333, "Augmented-Loss": 0.11621215208053588, "Clean-Accuracy": 98.85, "Clean-Loss": 0.056730573847889904, "PGD-Accuracy": 12.383333333333333, "PGD-Loss": 3.5966788686116535}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 25, "Epoch-Time": 241.65413522720337, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.16999816894531, "Augmented-0.05-Quantile-Accuracy": 97.22999572753906, "Augmented-0.1-Quantile-Accuracy": 97.7699966430664, "Augmented-Accuracy": 98.854, "Augmented-Loss": 0.1918970473279953, "Clean-Accuracy": 99.1, "Clean-Loss": 0.06134332585334778, "PGD-Accuracy": 11.9, "PGD-Loss": 3.191462385559082}, "Total-Time": 6034.726379394531, "Train": {"Loss": 1.5098583018338239, "avg t": 1.0014900881625988, "plain loss": 0.14110689104044882, "standard loss": 0.05978365415941786}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.1500015258789, "Augmented-0.05-Quantile-Accuracy": 97.76666259765625, "Augmented-0.1-Quantile-Accuracy": 98.23332977294922, "Augmented-Accuracy": 99.02183333333333, "Augmented-Loss": 0.18208457895596822, "Clean-Accuracy": 99.2, "Clean-Loss": 0.05996541462341944, "PGD-Accuracy": 11.183333333333334, "PGD-Loss": 3.1015350914001463}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 26, "Epoch-Time": 236.68529272079468, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.75999450683594, "Augmented-0.05-Quantile-Accuracy": 97.15999603271484, "Augmented-0.1-Quantile-Accuracy": 97.73999786376953, "Augmented-Accuracy": 98.7987, "Augmented-Loss": 0.08659342157411576, "Clean-Accuracy": 99.04, "Clean-Loss": 0.04003101763725281, "PGD-Accuracy": 12.24, "PGD-Loss": 3.699535531616211}, "Total-Time": 6271.411672115326, "Train": {"Loss": 1.4374341731954503, "avg t": 1.001006291883963, "plain loss": 0.14182053608364528, "standard loss": 0.05815748967506267}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.71666717529297, "Augmented-0.05-Quantile-Accuracy": 97.94999694824219, "Augmented-0.1-Quantile-Accuracy": 98.3499984741211, "Augmented-Accuracy": 98.99466666666666, "Augmented-Loss": 0.0800299415063858, "Clean-Accuracy": 99.15, "Clean-Loss": 0.04090218766157826, "PGD-Accuracy": 11.566666666666666, "PGD-Loss": 3.573356997172038}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 27, "Epoch-Time": 202.15277862548828, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.12999725341797, "Augmented-0.05-Quantile-Accuracy": 97.48999786376953, "Augmented-0.1-Quantile-Accuracy": 98.00999450683594, "Augmented-Accuracy": 98.9152, "Augmented-Loss": 0.09581834017920494, "Clean-Accuracy": 99.06, "Clean-Loss": 0.0421035539150238, "PGD-Accuracy": 12.76, "PGD-Loss": 3.3608261428833006}, "Total-Time": 6473.564450740814, "Train": {"Loss": 1.5141003817805538, "avg t": 1.001344495932261, "plain loss": 0.14332583968551066, "standard loss": 0.0594241896448312}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.13333129882812, "Augmented-0.05-Quantile-Accuracy": 98.28333282470703, "Augmented-0.1-Quantile-Accuracy": 98.53333282470703, "Augmented-Accuracy": 99.08233333333334, "Augmented-Loss": 0.08498846487661203, "Clean-Accuracy": 99.1, "Clean-Loss": 0.03992403193563223, "PGD-Accuracy": 12.35, "PGD-Loss": 3.219494302113851}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 28, "Epoch-Time": 230.47045135498047, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.82999420166016, "Augmented-0.05-Quantile-Accuracy": 97.40999603271484, "Augmented-0.1-Quantile-Accuracy": 97.86000061035156, "Augmented-Accuracy": 98.8214, "Augmented-Loss": 0.0639720558463335, "Clean-Accuracy": 98.92, "Clean-Loss": 0.03908645658791065, "PGD-Accuracy": 11.37, "PGD-Loss": 4.664555184936524}, "Total-Time": 6704.034902095795, "Train": {"Loss": 1.55247481141267, "avg t": 1.0021561761785436, "plain loss": 0.1380806030114492, "standard loss": 0.056303681876234433}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.5999984741211, "Augmented-0.05-Quantile-Accuracy": 97.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.01666259765625, "Augmented-Accuracy": 98.86116666666666, "Augmented-Loss": 0.06035643928622206, "Clean-Accuracy": 98.93333333333334, "Clean-Loss": 0.04073352459445596, "PGD-Accuracy": 11.033333333333333, "PGD-Loss": 4.431895464579265}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 29, "Epoch-Time": 241.5722029209137, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.69999694824219, "Augmented-0.05-Quantile-Accuracy": 97.36000061035156, "Augmented-0.1-Quantile-Accuracy": 97.93000030517578, "Augmented-Accuracy": 98.8925, "Augmented-Loss": 0.1519237434644699, "Clean-Accuracy": 99.08, "Clean-Loss": 0.05523868792057037, "PGD-Accuracy": 12.18, "PGD-Loss": 3.357554846191406}, "Total-Time": 6945.607105016708, "Train": {"Loss": 1.4758405324088202, "avg t": 1.001174212385107, "plain loss": 0.13950444644292195, "standard loss": 0.05819993662420246}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.43333435058594, "Augmented-0.05-Quantile-Accuracy": 97.79999542236328, "Augmented-0.1-Quantile-Accuracy": 98.26666259765625, "Augmented-Accuracy": 99.005, "Augmented-Loss": 0.14083647129972776, "Clean-Accuracy": 99.13333333333334, "Clean-Loss": 0.053359514365593594, "PGD-Accuracy": 11.716666666666667, "PGD-Loss": 3.229519371032715}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 30, "Epoch-Time": 241.77016067504883, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.97999572753906, "Augmented-0.05-Quantile-Accuracy": 97.43999481201172, "Augmented-0.1-Quantile-Accuracy": 98.00999450683594, "Augmented-Accuracy": 98.9711, "Augmented-Loss": 0.10023046727085114, "Clean-Accuracy": 99.14, "Clean-Loss": 0.03858665090799332, "PGD-Accuracy": 12.81, "PGD-Loss": 3.6600548004150393}, "Total-Time": 7187.377265691757, "Train": {"Loss": 1.4670547968899763, "avg t": 1.000965348596926, "plain loss": 0.13624613978774464, "standard loss": 0.05554222775940542}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.93333435058594, "Augmented-0.05-Quantile-Accuracy": 98.08333587646484, "Augmented-0.1-Quantile-Accuracy": 98.48332977294922, "Augmented-Accuracy": 99.05266666666667, "Augmented-Loss": 0.08653519219418367, "Clean-Accuracy": 99.2, "Clean-Loss": 0.03716205638522903, "PGD-Accuracy": 12.133333333333333, "PGD-Loss": 3.5106810251871745}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 31, "Epoch-Time": 241.43443655967712, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.58999633789062, "Augmented-0.05-Quantile-Accuracy": 97.80999755859375, "Augmented-0.1-Quantile-Accuracy": 98.16999816894531, "Augmented-Accuracy": 98.9401, "Augmented-Loss": 0.036344101970799264, "Clean-Accuracy": 99.04, "Clean-Loss": 0.03274218292930164, "PGD-Accuracy": 11.66, "PGD-Loss": 6.484388217163086}, "Total-Time": 7428.811702251434, "Train": {"Loss": 1.44812289569996, "avg t": 1.0009490002526178, "plain loss": 0.1378293480166681, "standard loss": 0.05904052052564091}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.33333587646484, "Augmented-0.05-Quantile-Accuracy": 98.06666564941406, "Augmented-0.1-Quantile-Accuracy": 98.43333435058594, "Augmented-Accuracy": 99.07, "Augmented-Loss": 0.037390989215032505, "Clean-Accuracy": 99.15, "Clean-Loss": 0.036751674087912155, "PGD-Accuracy": 11.35, "PGD-Loss": 6.174851666768392}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 32, "Epoch-Time": 207.0374138355255, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.02999877929688, "Augmented-0.05-Quantile-Accuracy": 97.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.05999755859375, "Augmented-Accuracy": 98.9286, "Augmented-Loss": 0.09671623822522163, "Clean-Accuracy": 99.0, "Clean-Loss": 0.041615320992469784, "PGD-Accuracy": 12.44, "PGD-Loss": 3.5037808868408202}, "Total-Time": 7635.84911608696, "Train": {"Loss": 1.5236214189176207, "avg t": 1.001662686559889, "plain loss": 0.13727542936537, "standard loss": 0.054108620689422994}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.8499984741211, "Augmented-0.05-Quantile-Accuracy": 98.04999542236328, "Augmented-0.1-Quantile-Accuracy": 98.29999542236328, "Augmented-Accuracy": 98.97233333333334, "Augmented-Loss": 0.08843072484751542, "Clean-Accuracy": 99.03333333333333, "Clean-Loss": 0.04260680206120014, "PGD-Accuracy": 11.416666666666666, "PGD-Loss": 3.3057927436828614}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 33, "Epoch-Time": 220.12091398239136, "Test": {"Augmented-0.01-Quantile-Accuracy": 91.25, "Augmented-0.05-Quantile-Accuracy": 94.89999389648438, "Augmented-0.1-Quantile-Accuracy": 95.98999786376953, "Augmented-Accuracy": 97.9393, "Augmented-Loss": 0.3298140878763199, "Clean-Accuracy": 98.85, "Clean-Loss": 0.0888214634180069, "PGD-Accuracy": 11.31, "PGD-Loss": 3.030428726196289}, "Total-Time": 7855.970030069351, "Train": {"Loss": 1.6006586356692845, "avg t": 1.0021790349041975, "plain loss": 0.13899677763691665, "standard loss": 0.05522344582996987}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 92.71666717529297, "Augmented-0.05-Quantile-Accuracy": 95.86666870117188, "Augmented-0.1-Quantile-Accuracy": 96.68333435058594, "Augmented-Accuracy": 98.2625, "Augmented-Loss": 0.29427419939517974, "Clean-Accuracy": 98.95, "Clean-Loss": 0.08154010647535324, "PGD-Accuracy": 10.5, "PGD-Loss": 3.0035026156107585}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 34, "Epoch-Time": 241.50018858909607, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.25999450683594, "Augmented-0.05-Quantile-Accuracy": 97.61000061035156, "Augmented-0.1-Quantile-Accuracy": 98.05999755859375, "Augmented-Accuracy": 98.9537, "Augmented-Loss": 0.07917438000488282, "Clean-Accuracy": 99.01, "Clean-Loss": 0.037115799510478976, "PGD-Accuracy": 12.61, "PGD-Loss": 3.7750227630615236}, "Total-Time": 8097.470218658447, "Train": {"Loss": 2.261946212132772, "avg t": 1.0043378891061854, "plain loss": 0.1409138614195364, "standard loss": 0.0621791377166907}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.19999694824219, "Augmented-0.05-Quantile-Accuracy": 98.08333587646484, "Augmented-0.1-Quantile-Accuracy": 98.43333435058594, "Augmented-Accuracy": 99.11033333333333, "Augmented-Loss": 0.07422742226243019, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.03962183917313814, "PGD-Accuracy": 12.283333333333333, "PGD-Loss": 3.61950124613444}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 35, "Epoch-Time": 241.52469611167908, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.91999816894531, "Augmented-0.05-Quantile-Accuracy": 96.8499984741211, "Augmented-0.1-Quantile-Accuracy": 97.41999816894531, "Augmented-Accuracy": 98.6742, "Augmented-Loss": 0.08915064302825927, "Clean-Accuracy": 98.8, "Clean-Loss": 0.043488765344023704, "PGD-Accuracy": 11.33, "PGD-Loss": 4.80838268737793}, "Total-Time": 8338.994914770126, "Train": {"Loss": 1.505929201832524, "avg t": 1.0011497621536254, "plain loss": 0.1337359538555146, "standard loss": 0.05367255337136211}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.06666564941406, "Augmented-0.05-Quantile-Accuracy": 97.75, "Augmented-0.1-Quantile-Accuracy": 98.1500015258789, "Augmented-Accuracy": 98.93766666666667, "Augmented-Loss": 0.0785771899207433, "Clean-Accuracy": 99.03333333333333, "Clean-Loss": 0.041897938355803487, "PGD-Accuracy": 10.75, "PGD-Loss": 4.471152692159017}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 36, "Epoch-Time": 241.51545119285583, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.38999938964844, "Augmented-0.05-Quantile-Accuracy": 97.75, "Augmented-0.1-Quantile-Accuracy": 98.20999908447266, "Augmented-Accuracy": 99.0763, "Augmented-Loss": 0.06125278523910046, "Clean-Accuracy": 99.2, "Clean-Loss": 0.031545739313960076, "PGD-Accuracy": 12.68, "PGD-Loss": 4.0027298202514645}, "Total-Time": 8580.510365962982, "Train": {"Loss": 1.5592022956565574, "avg t": 1.0016074685167384, "plain loss": 0.13158518586688558, "standard loss": 0.05418991705237163}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.03333282470703, "Augmented-0.05-Quantile-Accuracy": 98.03333282470703, "Augmented-0.1-Quantile-Accuracy": 98.3499984741211, "Augmented-Accuracy": 98.99433333333333, "Augmented-Loss": 0.059957837169667086, "Clean-Accuracy": 99.0, "Clean-Loss": 0.03786506205424666, "PGD-Accuracy": 12.4, "PGD-Loss": 3.8567454045613605}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 37, "Epoch-Time": 236.5745825767517, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.87999725341797, "Augmented-0.05-Quantile-Accuracy": 97.41999816894531, "Augmented-0.1-Quantile-Accuracy": 97.93000030517578, "Augmented-Accuracy": 98.9369, "Augmented-Loss": 0.11997486542844772, "Clean-Accuracy": 99.18, "Clean-Loss": 0.042288026112318036, "PGD-Accuracy": 11.96, "PGD-Loss": 3.3775164047241213}, "Total-Time": 8817.084948539734, "Train": {"Loss": 1.6385215093824599, "avg t": 1.0013429527635929, "plain loss": 0.1327789942547126, "standard loss": 0.05390437509091916}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.38333129882812, "Augmented-0.05-Quantile-Accuracy": 97.75, "Augmented-0.1-Quantile-Accuracy": 98.41666412353516, "Augmented-Accuracy": 99.03733333333334, "Augmented-Loss": 0.11205788364529609, "Clean-Accuracy": 99.11666666666666, "Clean-Loss": 0.043432061158120636, "PGD-Accuracy": 11.333333333333334, "PGD-Loss": 3.23285525004069}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 38, "Epoch-Time": 203.1680452823639, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.32999420166016, "Augmented-0.05-Quantile-Accuracy": 97.61000061035156, "Augmented-0.1-Quantile-Accuracy": 98.06999969482422, "Augmented-Accuracy": 98.9875, "Augmented-Loss": 0.06693503566777706, "Clean-Accuracy": 99.05, "Clean-Loss": 0.033627483174204824, "PGD-Accuracy": 12.42, "PGD-Loss": 4.432631900024414}, "Total-Time": 9020.252993822098, "Train": {"Loss": 1.6258879246888338, "avg t": 1.001550659109045, "plain loss": 0.133133658506252, "standard loss": 0.05358511424754505}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.06666564941406, "Augmented-0.05-Quantile-Accuracy": 98.03333282470703, "Augmented-0.1-Quantile-Accuracy": 98.3499984741211, "Augmented-Accuracy": 99.02583333333334, "Augmented-Loss": 0.06420358017727733, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.04049066848183672, "PGD-Accuracy": 12.133333333333333, "PGD-Loss": 4.163437578837077}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 39, "Epoch-Time": 231.44935512542725, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.3699951171875, "Augmented-0.05-Quantile-Accuracy": 97.50999450683594, "Augmented-0.1-Quantile-Accuracy": 98.04000091552734, "Augmented-Accuracy": 98.8816, "Augmented-Loss": 0.03702064579003956, "Clean-Accuracy": 99.02, "Clean-Loss": 0.03792011898534838, "PGD-Accuracy": 11.29, "PGD-Loss": 8.585773303222656}, "Total-Time": 9251.702348947525, "Train": {"Loss": 2.2783117502707024, "avg t": 1.0046507749204283, "plain loss": 0.14322551581329782, "standard loss": 0.05853772961269823}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.16666412353516, "Augmented-0.05-Quantile-Accuracy": 98.06666564941406, "Augmented-0.1-Quantile-Accuracy": 98.46666717529297, "Augmented-Accuracy": 99.08, "Augmented-Loss": 0.037976810827072674, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.04234472675735621, "PGD-Accuracy": 10.966666666666667, "PGD-Loss": 8.164086761474609}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 40, "Epoch-Time": 241.32549953460693, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.38999938964844, "Augmented-0.05-Quantile-Accuracy": 97.16999816894531, "Augmented-0.1-Quantile-Accuracy": 97.87999725341797, "Augmented-Accuracy": 98.9147, "Augmented-Loss": 0.0932656047796011, "Clean-Accuracy": 99.14, "Clean-Loss": 0.03282912103831768, "PGD-Accuracy": 10.99, "PGD-Loss": 3.928808491516113}, "Total-Time": 9493.027848482132, "Train": {"Loss": 1.6995187690876148, "avg t": 1.0026967335806953, "plain loss": 0.12751654370096008, "standard loss": 0.047009543970641166}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.33333587646484, "Augmented-0.05-Quantile-Accuracy": 97.86666870117188, "Augmented-0.1-Quantile-Accuracy": 98.38333129882812, "Augmented-Accuracy": 99.0115, "Augmented-Loss": 0.08384356664478779, "Clean-Accuracy": 99.16666666666667, "Clean-Loss": 0.03813936120582124, "PGD-Accuracy": 10.316666666666666, "PGD-Loss": 3.8016859486897787}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 41, "Epoch-Time": 241.67834782600403, "Test": {"Augmented-0.01-Quantile-Accuracy": 93.18999481201172, "Augmented-0.05-Quantile-Accuracy": 95.93000030517578, "Augmented-0.1-Quantile-Accuracy": 96.75, "Augmented-Accuracy": 98.3731, "Augmented-Loss": 0.11578323647117615, "Clean-Accuracy": 98.8, "Clean-Loss": 0.040666355794295665, "PGD-Accuracy": 10.93, "PGD-Loss": 4.58654309387207}, "Total-Time": 9734.706196308136, "Train": {"Loss": 1.6327388134002685, "avg t": 1.0017228717803954, "plain loss": 0.12491268785441369, "standard loss": 0.04920768570748192}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 94.44999694824219, "Augmented-0.05-Quantile-Accuracy": 96.76666259765625, "Augmented-0.1-Quantile-Accuracy": 97.46666717529297, "Augmented-Accuracy": 98.56466666666667, "Augmented-Loss": 0.10275254578282436, "Clean-Accuracy": 98.91666666666667, "Clean-Loss": 0.04886304173540945, "PGD-Accuracy": 10.2, "PGD-Loss": 4.416134788513183}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 42, "Epoch-Time": 241.5658392906189, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.47999572753906, "Augmented-0.05-Quantile-Accuracy": 97.32999420166016, "Augmented-0.1-Quantile-Accuracy": 97.89999389648438, "Augmented-Accuracy": 98.8628, "Augmented-Loss": 0.06794315631812811, "Clean-Accuracy": 99.03, "Clean-Loss": 0.03523583184853196, "PGD-Accuracy": 10.98, "PGD-Loss": 5.1021349609375}, "Total-Time": 9976.272035598755, "Train": {"Loss": 1.6878388349391795, "avg t": 1.001440174985815, "plain loss": 0.12755784870606876, "standard loss": 0.04912754306562797}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.33333587646484, "Augmented-0.05-Quantile-Accuracy": 97.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.13333129882812, "Augmented-Accuracy": 99.002, "Augmented-Loss": 0.06304190792431434, "Clean-Accuracy": 99.13333333333334, "Clean-Loss": 0.04009278121155997, "PGD-Accuracy": 10.45, "PGD-Loss": 4.916806948343913}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 43, "Epoch-Time": 206.8663318157196, "Test": {"Augmented-0.01-Quantile-Accuracy": 88.79999542236328, "Augmented-0.05-Quantile-Accuracy": 93.54999542236328, "Augmented-0.1-Quantile-Accuracy": 94.89999389648438, "Augmented-Accuracy": 97.3977, "Augmented-Loss": 0.30521562478256226, "Clean-Accuracy": 98.79, "Clean-Loss": 0.08161801598072052, "PGD-Accuracy": 11.62, "PGD-Loss": 3.4596622543334963}, "Total-Time": 10183.138367414474, "Train": {"Loss": 1.5968571686921296, "avg t": 1.001780500906485, "plain loss": 0.12989914510426695, "standard loss": 0.05055715450837656}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 90.71666717529297, "Augmented-0.05-Quantile-Accuracy": 94.71666717529297, "Augmented-0.1-Quantile-Accuracy": 95.93333435058594, "Augmented-Accuracy": 97.94016666666667, "Augmented-Loss": 0.2570349208732446, "Clean-Accuracy": 98.95, "Clean-Loss": 0.07151611866056919, "PGD-Accuracy": 10.566666666666666, "PGD-Loss": 3.424663879394531}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 44, "Epoch-Time": 219.98006176948547, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.83999633789062, "Augmented-0.05-Quantile-Accuracy": 97.48999786376953, "Augmented-0.1-Quantile-Accuracy": 97.90999603271484, "Augmented-Accuracy": 98.9403, "Augmented-Loss": 0.0944502283089161, "Clean-Accuracy": 99.13, "Clean-Loss": 0.03496263946890831, "PGD-Accuracy": 11.32, "PGD-Loss": 3.7106846298217775}, "Total-Time": 10403.11842918396, "Train": {"Loss": 1.5340119501749674, "avg t": 1.001107034506621, "plain loss": 0.1255018279534798, "standard loss": 0.04809560086357373}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.6500015258789, "Augmented-0.05-Quantile-Accuracy": 97.79999542236328, "Augmented-0.1-Quantile-Accuracy": 98.23332977294922, "Augmented-Accuracy": 99.01533333333333, "Augmented-Loss": 0.09083008589585623, "Clean-Accuracy": 99.15, "Clean-Loss": 0.040140873392423, "PGD-Accuracy": 10.65, "PGD-Loss": 3.551177474975586}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 45, "Epoch-Time": 241.6256754398346, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.68000030517578, "Augmented-0.05-Quantile-Accuracy": 97.36000061035156, "Augmented-0.1-Quantile-Accuracy": 97.98999786376953, "Augmented-Accuracy": 98.9219, "Augmented-Loss": 0.08956449101829529, "Clean-Accuracy": 99.14, "Clean-Loss": 0.03458981079012156, "PGD-Accuracy": 11.27, "PGD-Loss": 3.930790168762207}, "Total-Time": 10644.744104623795, "Train": {"Loss": 2.191346001271848, "avg t": 1.002679613607901, "plain loss": 0.13474534568433416, "standard loss": 0.05241479754765276}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.38333129882812, "Augmented-0.05-Quantile-Accuracy": 97.81666564941406, "Augmented-0.1-Quantile-Accuracy": 98.19999694824219, "Augmented-Accuracy": 99.04866666666666, "Augmented-Loss": 0.08347279664506514, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.036863138907278575, "PGD-Accuracy": 10.666666666666666, "PGD-Loss": 3.730103411356608}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 46, "Epoch-Time": 241.48786401748657, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.66999816894531, "Augmented-0.05-Quantile-Accuracy": 97.3699951171875, "Augmented-0.1-Quantile-Accuracy": 97.97999572753906, "Augmented-Accuracy": 99.0005, "Augmented-Loss": 0.09266978996491432, "Clean-Accuracy": 99.2, "Clean-Loss": 0.03500512539148331, "PGD-Accuracy": 10.93, "PGD-Loss": 3.8357546752929688}, "Total-Time": 10886.231968641281, "Train": {"Loss": 1.7305163584108705, "avg t": 1.002925755571436, "plain loss": 0.12496525808440312, "standard loss": 0.047409339959767684}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.48332977294922, "Augmented-0.05-Quantile-Accuracy": 97.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.28333282470703, "Augmented-Accuracy": 99.00233333333334, "Augmented-Loss": 0.08386206553359826, "Clean-Accuracy": 99.06666666666666, "Clean-Loss": 0.03950312175850074, "PGD-Accuracy": 10.45, "PGD-Loss": 3.6635135498046876}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 47, "Epoch-Time": 241.43481063842773, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.5, "Augmented-0.05-Quantile-Accuracy": 96.2699966430664, "Augmented-0.1-Quantile-Accuracy": 97.02999877929688, "Augmented-Accuracy": 98.4133, "Augmented-Loss": 0.1168672625761032, "Clean-Accuracy": 98.98, "Clean-Loss": 0.04750402839481831, "PGD-Accuracy": 11.49, "PGD-Loss": 3.9690030731201174}, "Total-Time": 11127.666779279709, "Train": {"Loss": 2.0043829838081644, "avg t": 1.0030020962821113, "plain loss": 0.12932764788910203, "standard loss": 0.053009793196839315}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.38333129882812, "Augmented-0.05-Quantile-Accuracy": 97.0999984741211, "Augmented-0.1-Quantile-Accuracy": 97.46666717529297, "Augmented-Accuracy": 98.479, "Augmented-Loss": 0.11192724639236927, "Clean-Accuracy": 98.98333333333333, "Clean-Loss": 0.050870257578790185, "PGD-Accuracy": 10.9, "PGD-Loss": 3.8210068130493164}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 48, "Epoch-Time": 235.2215678691864, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.29999542236328, "Augmented-0.05-Quantile-Accuracy": 97.68000030517578, "Augmented-0.1-Quantile-Accuracy": 98.15999603271484, "Augmented-Accuracy": 99.0052, "Augmented-Loss": 0.06693300786030293, "Clean-Accuracy": 99.18, "Clean-Loss": 0.03210267763286829, "PGD-Accuracy": 11.38, "PGD-Loss": 4.016326078796387}, "Total-Time": 11362.888347148895, "Train": {"Loss": 1.8437320981908727, "avg t": 1.0027213768076013, "plain loss": 0.13069869185200447, "standard loss": 0.050709144874855325}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.83333587646484, "Augmented-0.05-Quantile-Accuracy": 98.06666564941406, "Augmented-0.1-Quantile-Accuracy": 98.36666870117188, "Augmented-Accuracy": 99.05366666666667, "Augmented-Loss": 0.06883517935385307, "Clean-Accuracy": 99.16666666666667, "Clean-Loss": 0.037644559006517135, "PGD-Accuracy": 10.816666666666666, "PGD-Loss": 3.7515734570821127}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 49, "Epoch-Time": 203.43825316429138, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.58999633789062, "Augmented-0.05-Quantile-Accuracy": 96.68999481201172, "Augmented-0.1-Quantile-Accuracy": 97.33999633789062, "Augmented-Accuracy": 98.6697, "Augmented-Loss": 0.11630739111161233, "Clean-Accuracy": 99.16, "Clean-Loss": 0.03854822538644075, "PGD-Accuracy": 11.08, "PGD-Loss": 3.904164956665039}, "Total-Time": 11566.326600313187, "Train": {"Loss": 1.6881034663165058, "avg t": 1.0021716082890828, "plain loss": 0.12418440787880507, "standard loss": 0.04732082914857677}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.48332977294922, "Augmented-0.05-Quantile-Accuracy": 97.3499984741211, "Augmented-0.1-Quantile-Accuracy": 97.96666717529297, "Augmented-Accuracy": 98.88933333333334, "Augmented-Loss": 0.1050387751676639, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.04282960993920763, "PGD-Accuracy": 10.2, "PGD-Loss": 3.744615348815918}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 50, "Epoch-Time": 232.1944282054901, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.32999420166016, "Augmented-0.05-Quantile-Accuracy": 97.2699966430664, "Augmented-0.1-Quantile-Accuracy": 97.79999542236328, "Augmented-Accuracy": 98.8634, "Augmented-Loss": 0.12751055807375908, "Clean-Accuracy": 99.12, "Clean-Loss": 0.041195122012496, "PGD-Accuracy": 11.45, "PGD-Loss": 3.5662370346069334}, "Total-Time": 11798.521028518677, "Train": {"Loss": 1.557378435170209, "avg t": 1.0016225149013378, "plain loss": 0.12108182198029961, "standard loss": 0.045474737825079097}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.33333587646484, "Augmented-0.05-Quantile-Accuracy": 97.8499984741211, "Augmented-0.1-Quantile-Accuracy": 98.21666717529297, "Augmented-Accuracy": 98.99916666666667, "Augmented-Loss": 0.11684980463584264, "Clean-Accuracy": 99.16666666666667, "Clean-Loss": 0.04396258038034042, "PGD-Accuracy": 10.533333333333333, "PGD-Loss": 3.456863650004069}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 51, "Epoch-Time": 241.4368236064911, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.44999694824219, "Augmented-0.05-Quantile-Accuracy": 97.82999420166016, "Augmented-0.1-Quantile-Accuracy": 98.32999420166016, "Augmented-Accuracy": 99.0714, "Augmented-Loss": 0.08028791502737999, "Clean-Accuracy": 99.26, "Clean-Loss": 0.033227680814266206, "PGD-Accuracy": 11.3, "PGD-Loss": 3.7856201522827146}, "Total-Time": 12039.957852125168, "Train": {"Loss": 1.623176877057111, "avg t": 1.0019192934036254, "plain loss": 0.12585096204369148, "standard loss": 0.04848286440692566}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.98332977294922, "Augmented-0.05-Quantile-Accuracy": 98.0999984741211, "Augmented-0.1-Quantile-Accuracy": 98.5, "Augmented-Accuracy": 99.125, "Augmented-Loss": 0.07620439070463181, "Clean-Accuracy": 99.16666666666667, "Clean-Loss": 0.037943399994323654, "PGD-Accuracy": 10.616666666666667, "PGD-Loss": 3.583465741475423}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 52, "Epoch-Time": 241.66274285316467, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.36000061035156, "Augmented-0.05-Quantile-Accuracy": 97.79999542236328, "Augmented-0.1-Quantile-Accuracy": 98.20999908447266, "Augmented-Accuracy": 99.0108, "Augmented-Loss": 0.08251166924655437, "Clean-Accuracy": 99.12, "Clean-Loss": 0.03617993490695953, "PGD-Accuracy": 11.07, "PGD-Loss": 3.8423494049072264}, "Total-Time": 12281.620594978333, "Train": {"Loss": 1.8711921323846887, "avg t": 1.002932796495932, "plain loss": 0.12693701932518578, "standard loss": 0.050325889342774946}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.98332977294922, "Augmented-0.05-Quantile-Accuracy": 97.96666717529297, "Augmented-0.1-Quantile-Accuracy": 98.29999542236328, "Augmented-Accuracy": 99.03, "Augmented-Loss": 0.07634773755341769, "Clean-Accuracy": 99.15, "Clean-Loss": 0.03868851415067911, "PGD-Accuracy": 10.616666666666667, "PGD-Loss": 3.6524061800638834}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 53, "Epoch-Time": 241.46544694900513, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.7699966430664, "Augmented-0.05-Quantile-Accuracy": 97.47999572753906, "Augmented-0.1-Quantile-Accuracy": 97.88999938964844, "Augmented-Accuracy": 98.9076, "Augmented-Loss": 0.06477855437791348, "Clean-Accuracy": 99.01, "Clean-Loss": 0.03659947894364595, "PGD-Accuracy": 10.14, "PGD-Loss": 5.829053616333008}, "Total-Time": 12523.086041927338, "Train": {"Loss": 1.5716948743749548, "avg t": 1.0014008231163025, "plain loss": 0.1242865240370787, "standard loss": 0.04957577075754051}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.23332977294922, "Augmented-0.05-Quantile-Accuracy": 97.58333587646484, "Augmented-0.1-Quantile-Accuracy": 97.9000015258789, "Augmented-Accuracy": 98.816, "Augmented-Loss": 0.06822053125441074, "Clean-Accuracy": 98.9, "Clean-Loss": 0.04519544623792172, "PGD-Accuracy": 10.016666666666667, "PGD-Loss": 5.512578315734864}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 54, "Epoch-Time": 206.18009519577026, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.58999633789062, "Augmented-0.05-Quantile-Accuracy": 97.39999389648438, "Augmented-0.1-Quantile-Accuracy": 97.8699951171875, "Augmented-Accuracy": 98.9419, "Augmented-Loss": 0.08875204173803329, "Clean-Accuracy": 99.13, "Clean-Loss": 0.0341592488348484, "PGD-Accuracy": 10.95, "PGD-Loss": 3.9330714416503905}, "Total-Time": 12729.266137123108, "Train": {"Loss": 1.5810190123452081, "avg t": 1.0009133616906625, "plain loss": 0.1276954771977882, "standard loss": 0.04707519704413911}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.53333282470703, "Augmented-0.05-Quantile-Accuracy": 97.88333129882812, "Augmented-0.1-Quantile-Accuracy": 98.3499984741211, "Augmented-Accuracy": 99.0505, "Augmented-Loss": 0.08250839874337117, "Clean-Accuracy": 99.25, "Clean-Loss": 0.037373536185051, "PGD-Accuracy": 10.166666666666666, "PGD-Loss": 3.6783347282409666}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 55, "Epoch-Time": 219.47664976119995, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.43000030517578, "Augmented-0.05-Quantile-Accuracy": 97.77999877929688, "Augmented-0.1-Quantile-Accuracy": 98.18000030517578, "Augmented-Accuracy": 99.0605, "Augmented-Loss": 0.08310988896989822, "Clean-Accuracy": 99.27, "Clean-Loss": 0.03454845724105835, "PGD-Accuracy": 10.79, "PGD-Loss": 3.5941946075439453}, "Total-Time": 12948.742786884308, "Train": {"Loss": 1.7135554907763446, "avg t": 1.0022585102540476, "plain loss": 0.12669960888050213, "standard loss": 0.04853789673918099}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.16666412353516, "Augmented-0.05-Quantile-Accuracy": 98.23332977294922, "Augmented-0.1-Quantile-Accuracy": 98.44999694824219, "Augmented-Accuracy": 99.07866666666666, "Augmented-Loss": 0.0778138653912147, "Clean-Accuracy": 99.1, "Clean-Loss": 0.03832584207629164, "PGD-Accuracy": 10.183333333333334, "PGD-Loss": 3.432696268717448}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 56, "Epoch-Time": 241.26227927207947, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.68000030517578, "Augmented-0.05-Quantile-Accuracy": 97.80999755859375, "Augmented-0.1-Quantile-Accuracy": 98.2699966430664, "Augmented-Accuracy": 99.0785, "Augmented-Loss": 0.04792363888809085, "Clean-Accuracy": 99.18, "Clean-Loss": 0.028719240384548903, "PGD-Accuracy": 11.01, "PGD-Loss": 4.788743344116211}, "Total-Time": 13190.005066156387, "Train": {"Loss": 1.526555770414847, "avg t": 1.0009449010071931, "plain loss": 0.12507595320984183, "standard loss": 0.048478893294378565}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.29999542236328, "Augmented-0.05-Quantile-Accuracy": 98.28333282470703, "Augmented-0.1-Quantile-Accuracy": 98.61666870117188, "Augmented-Accuracy": 99.18633333333334, "Augmented-Loss": 0.04793316137505074, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.035237629253882914, "PGD-Accuracy": 10.283333333333333, "PGD-Loss": 4.540725296020508}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 57, "Epoch-Time": 241.4930727481842, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.95999908447266, "Augmented-0.05-Quantile-Accuracy": 97.47000122070312, "Augmented-0.1-Quantile-Accuracy": 98.04000091552734, "Augmented-Accuracy": 98.9653, "Augmented-Loss": 0.08630689242088795, "Clean-Accuracy": 99.2, "Clean-Loss": 0.034484010204672816, "PGD-Accuracy": 11.14, "PGD-Loss": 3.549112208557129}, "Total-Time": 13431.498138904572, "Train": {"Loss": 2.289941516381723, "avg t": 1.0031496657088952, "plain loss": 0.13966093875390506, "standard loss": 0.05294666589879327}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.75, "Augmented-0.05-Quantile-Accuracy": 98.0999984741211, "Augmented-0.1-Quantile-Accuracy": 98.43333435058594, "Augmented-Accuracy": 99.0465, "Augmented-Loss": 0.0798356872222821, "Clean-Accuracy": 99.16666666666667, "Clean-Loss": 0.03753384568914771, "PGD-Accuracy": 10.4, "PGD-Loss": 3.3647975374857584}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 58, "Epoch-Time": 241.23693299293518, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.2699966430664, "Augmented-0.05-Quantile-Accuracy": 97.22999572753906, "Augmented-0.1-Quantile-Accuracy": 97.72999572753906, "Augmented-Accuracy": 98.7724, "Augmented-Loss": 0.0908731482386589, "Clean-Accuracy": 98.95, "Clean-Loss": 0.04230536090135574, "PGD-Accuracy": 10.76, "PGD-Loss": 3.9027254974365233}, "Total-Time": 13672.735071897507, "Train": {"Loss": 1.5836929589377509, "avg t": 1.0008840889047694, "plain loss": 0.12713951023419706, "standard loss": 0.04733095683405797}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.36666870117188, "Augmented-0.05-Quantile-Accuracy": 97.69999694824219, "Augmented-0.1-Quantile-Accuracy": 98.1500015258789, "Augmented-Accuracy": 98.94383333333333, "Augmented-Loss": 0.08009371581017971, "Clean-Accuracy": 98.96666666666667, "Clean-Loss": 0.04226170472552379, "PGD-Accuracy": 10.05, "PGD-Loss": 3.7609356816609703}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 59, "Epoch-Time": 233.99434161186218, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.0, "Augmented-0.05-Quantile-Accuracy": 97.47999572753906, "Augmented-0.1-Quantile-Accuracy": 98.0, "Augmented-Accuracy": 98.8913, "Augmented-Loss": 0.06331252072161436, "Clean-Accuracy": 99.17, "Clean-Loss": 0.031034687381982805, "PGD-Accuracy": 10.49, "PGD-Loss": 4.9445148345947265}, "Total-Time": 13906.729413509369, "Train": {"Loss": 1.9475136619850442, "avg t": 1.0027837320610329, "plain loss": 0.12799121391155088, "standard loss": 0.051950684447600336}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.81666564941406, "Augmented-0.05-Quantile-Accuracy": 97.98332977294922, "Augmented-0.1-Quantile-Accuracy": 98.38333129882812, "Augmented-Accuracy": 99.0365, "Augmented-Loss": 0.06388652323072155, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.038478126826385656, "PGD-Accuracy": 9.983333333333333, "PGD-Loss": 4.694376508076986}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 60, "Epoch-Time": 203.87711358070374, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.79000091552734, "Augmented-0.05-Quantile-Accuracy": 97.88999938964844, "Augmented-0.1-Quantile-Accuracy": 98.27999877929688, "Augmented-Accuracy": 99.0263, "Augmented-Loss": 0.045349058843672276, "Clean-Accuracy": 99.15, "Clean-Loss": 0.03270626804251224, "PGD-Accuracy": 9.95, "PGD-Loss": 5.740531488037109}, "Total-Time": 14110.606527090073, "Train": {"Loss": 1.7233295868767633, "avg t": 1.0015425090436583, "plain loss": 0.12716520548749857, "standard loss": 0.048768726736514105}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.41666412353516, "Augmented-0.05-Quantile-Accuracy": 98.29999542236328, "Augmented-0.1-Quantile-Accuracy": 98.58333587646484, "Augmented-Accuracy": 99.138, "Augmented-Loss": 0.047361910093364615, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.03955298171696874, "PGD-Accuracy": 9.366666666666667, "PGD-Loss": 5.417157432556152}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 61, "Epoch-Time": 232.54336094856262, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.75, "Augmented-0.05-Quantile-Accuracy": 97.30999755859375, "Augmented-0.1-Quantile-Accuracy": 97.88999938964844, "Augmented-Accuracy": 98.8555, "Augmented-Loss": 0.05363996707868576, "Clean-Accuracy": 98.92, "Clean-Loss": 0.03759047635570169, "PGD-Accuracy": 9.85, "PGD-Loss": 6.072912924194336}, "Total-Time": 14343.149888038635, "Train": {"Loss": 1.6680774081194842, "avg t": 1.0017163130618907, "plain loss": 0.12342231821660635, "standard loss": 0.048691176059345406}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.73332977294922, "Augmented-0.05-Quantile-Accuracy": 97.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.1500015258789, "Augmented-Accuracy": 98.90766666666667, "Augmented-Loss": 0.052523957581756014, "Clean-Accuracy": 99.01666666666667, "Clean-Loss": 0.041310802033481496, "PGD-Accuracy": 9.15, "PGD-Loss": 5.6140004272460935}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 62, "Epoch-Time": 241.61406636238098, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.47999572753906, "Augmented-0.05-Quantile-Accuracy": 97.66999816894531, "Augmented-0.1-Quantile-Accuracy": 98.16999816894531, "Augmented-Accuracy": 99.0156, "Augmented-Loss": 0.08662476624906063, "Clean-Accuracy": 99.13, "Clean-Loss": 0.035906170749664304, "PGD-Accuracy": 11.34, "PGD-Loss": 3.5297141662597658}, "Total-Time": 14584.763954401016, "Train": {"Loss": 1.4864447450284604, "avg t": 1.0002647312658803, "plain loss": 0.1195515721056196, "standard loss": 0.04399969957199776}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.21666717529297, "Augmented-0.05-Quantile-Accuracy": 98.21666717529297, "Augmented-0.1-Quantile-Accuracy": 98.56666564941406, "Augmented-Accuracy": 99.06733333333334, "Augmented-Loss": 0.07927563407669465, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.039868889284630615, "PGD-Accuracy": 10.566666666666666, "PGD-Loss": 3.4393612569173175}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 63, "Epoch-Time": 241.65072178840637, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.97000122070312, "Augmented-0.05-Quantile-Accuracy": 97.90999603271484, "Augmented-0.1-Quantile-Accuracy": 98.18000030517578, "Augmented-Accuracy": 98.988, "Augmented-Loss": 0.035396352206937036, "Clean-Accuracy": 99.08, "Clean-Loss": 0.036518688624969216, "PGD-Accuracy": 13.33, "PGD-Loss": 10.972580419921876}, "Total-Time": 14826.414676189423, "Train": {"Loss": 2.2472194995880126, "avg t": 1.001981841723124, "plain loss": 0.12864340048366113, "standard loss": 0.05148761090784575}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.4000015258789, "Augmented-0.05-Quantile-Accuracy": 98.26666259765625, "Augmented-0.1-Quantile-Accuracy": 98.44999694824219, "Augmented-Accuracy": 99.0995, "Augmented-Loss": 0.04157432739513344, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.04466957496838101, "PGD-Accuracy": 13.6, "PGD-Loss": 10.389602747599284}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 64, "Epoch-Time": 241.52338075637817, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.3499984741211, "Augmented-0.05-Quantile-Accuracy": 97.14999389648438, "Augmented-0.1-Quantile-Accuracy": 97.69999694824219, "Augmented-Accuracy": 98.7782, "Augmented-Loss": 0.05588479075652361, "Clean-Accuracy": 98.92, "Clean-Loss": 0.04105867476472631, "PGD-Accuracy": 11.74, "PGD-Loss": 7.625684948730469}, "Total-Time": 15067.9380569458, "Train": {"Loss": 9.063898936801486, "avg t": 1.0451067935095892, "plain loss": 0.30092753323802257, "standard loss": 0.19106947420390874}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.08333587646484, "Augmented-0.05-Quantile-Accuracy": 97.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.04999542236328, "Augmented-Accuracy": 98.902, "Augmented-Loss": 0.05373978194601834, "Clean-Accuracy": 98.93333333333334, "Clean-Loss": 0.046483572441890525, "PGD-Accuracy": 11.716666666666667, "PGD-Loss": 7.199817504882812}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 65, "Epoch-Time": 206.23820424079895, "Test": {"Augmented-0.01-Quantile-Accuracy": 90.63999938964844, "Augmented-0.05-Quantile-Accuracy": 94.63999938964844, "Augmented-0.1-Quantile-Accuracy": 95.90999603271484, "Augmented-Accuracy": 97.873, "Augmented-Loss": 0.17897985465431213, "Clean-Accuracy": 98.86, "Clean-Loss": 0.05171957364976406, "PGD-Accuracy": 10.91, "PGD-Loss": 4.74446953125}, "Total-Time": 15274.1762611866, "Train": {"Loss": 7.640645146687826, "avg t": 1.0347986818949382, "plain loss": 0.26270512851432487, "standard loss": 0.1401420042015336}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 92.1500015258789, "Augmented-0.05-Quantile-Accuracy": 95.58333587646484, "Augmented-0.1-Quantile-Accuracy": 96.54999542236328, "Augmented-Accuracy": 98.241, "Augmented-Loss": 0.15417490443487963, "Clean-Accuracy": 98.86666666666666, "Clean-Loss": 0.04851484273870786, "PGD-Accuracy": 10.116666666666667, "PGD-Loss": 4.618334760030111}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 66, "Epoch-Time": 219.38476634025574, "Test": {"Augmented-0.01-Quantile-Accuracy": 93.63999938964844, "Augmented-0.05-Quantile-Accuracy": 96.27999877929688, "Augmented-0.1-Quantile-Accuracy": 97.18000030517578, "Augmented-Accuracy": 98.5678, "Augmented-Loss": 0.11676408379030227, "Clean-Accuracy": 98.95, "Clean-Loss": 0.04216219242960215, "PGD-Accuracy": 10.72, "PGD-Loss": 5.476921923828125}, "Total-Time": 15493.561027526855, "Train": {"Loss": 3.666052164501614, "avg t": 1.017886934209753, "plain loss": 0.19214508158189267, "standard loss": 0.09317748107968105}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 94.0999984741211, "Augmented-0.05-Quantile-Accuracy": 96.63333129882812, "Augmented-0.1-Quantile-Accuracy": 97.5, "Augmented-Accuracy": 98.618, "Augmented-Loss": 0.10595196201841037, "Clean-Accuracy": 98.91666666666667, "Clean-Loss": 0.0465803887580211, "PGD-Accuracy": 10.3, "PGD-Loss": 5.1814794413248695}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 67, "Epoch-Time": 241.3911280632019, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.04000091552734, "Augmented-0.05-Quantile-Accuracy": 96.44999694824219, "Augmented-0.1-Quantile-Accuracy": 97.12999725341797, "Augmented-Accuracy": 98.603, "Augmented-Loss": 0.12986916785216332, "Clean-Accuracy": 98.97, "Clean-Loss": 0.06818041234016418, "PGD-Accuracy": 12.01, "PGD-Loss": 4.554032234191895}, "Total-Time": 15734.952155590057, "Train": {"Loss": 3.1158412837628964, "avg t": 1.0150246656912345, "plain loss": 0.18030609839050857, "standard loss": 0.09740553647666066}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 94.86666870117188, "Augmented-0.05-Quantile-Accuracy": 96.9000015258789, "Augmented-0.1-Quantile-Accuracy": 97.54999542236328, "Augmented-Accuracy": 98.67716666666666, "Augmented-Loss": 0.11364155585030715, "Clean-Accuracy": 98.9, "Clean-Loss": 0.06430647080143292, "PGD-Accuracy": 11.366666666666667, "PGD-Loss": 4.445671765645345}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 68, "Epoch-Time": 241.86487555503845, "Test": {"Augmented-0.01-Quantile-Accuracy": 90.77999877929688, "Augmented-0.05-Quantile-Accuracy": 94.8699951171875, "Augmented-0.1-Quantile-Accuracy": 96.02999877929688, "Augmented-Accuracy": 98.0547, "Augmented-Loss": 0.17681843627786636, "Clean-Accuracy": 98.72, "Clean-Loss": 0.05811662917137146, "PGD-Accuracy": 10.82, "PGD-Loss": 4.524804873657226}, "Total-Time": 15976.817031145096, "Train": {"Loss": 3.0658597027813945, "avg t": 1.014199868272852, "plain loss": 0.1753549525525834, "standard loss": 0.10193850610943304}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 92.81666564941406, "Augmented-0.05-Quantile-Accuracy": 95.93333435058594, "Augmented-0.1-Quantile-Accuracy": 96.68333435058594, "Augmented-Accuracy": 98.37783333333333, "Augmented-Loss": 0.15822101591626803, "Clean-Accuracy": 98.86666666666666, "Clean-Loss": 0.053714197285473345, "PGD-Accuracy": 10.2, "PGD-Loss": 4.341473642985026}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 69, "Epoch-Time": 241.64131093025208, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.90999603271484, "Augmented-0.05-Quantile-Accuracy": 96.87999725341797, "Augmented-0.1-Quantile-Accuracy": 97.6199951171875, "Augmented-Accuracy": 98.7306, "Augmented-Loss": 0.07993086068379879, "Clean-Accuracy": 99.05, "Clean-Loss": 0.045643210735917095, "PGD-Accuracy": 12.54, "PGD-Loss": 5.526086538696289}, "Total-Time": 16218.458342075348, "Train": {"Loss": 2.785134979389332, "avg t": 1.0127318416524815, "plain loss": 0.17063018409940922, "standard loss": 0.1013780217282474}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.9000015258789, "Augmented-0.05-Quantile-Accuracy": 97.68333435058594, "Augmented-0.1-Quantile-Accuracy": 98.13333129882812, "Augmented-Accuracy": 98.96266666666666, "Augmented-Loss": 0.07293170602202416, "Clean-Accuracy": 99.08333333333333, "Clean-Loss": 0.04726456786940495, "PGD-Accuracy": 12.3, "PGD-Loss": 5.2066465098063155}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 70, "Epoch-Time": 232.73924326896667, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.83999633789062, "Augmented-0.05-Quantile-Accuracy": 96.83999633789062, "Augmented-0.1-Quantile-Accuracy": 97.54000091552734, "Augmented-Accuracy": 98.7864, "Augmented-Loss": 0.11863337326240539, "Clean-Accuracy": 99.12, "Clean-Loss": 0.060813177073001864, "PGD-Accuracy": 12.7, "PGD-Loss": 4.005859283447266}, "Total-Time": 16451.197585344315, "Train": {"Loss": 2.6839816244619863, "avg t": 1.0106316776275635, "plain loss": 0.16569309363541773, "standard loss": 0.0973175137316877}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.56666564941406, "Augmented-0.05-Quantile-Accuracy": 97.21666717529297, "Augmented-0.1-Quantile-Accuracy": 97.54999542236328, "Augmented-Accuracy": 98.7575, "Augmented-Loss": 0.10755663836757343, "Clean-Accuracy": 98.93333333333334, "Clean-Loss": 0.06063555247088273, "PGD-Accuracy": 12.116666666666667, "PGD-Loss": 3.860748977661133}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 71, "Epoch-Time": 204.37010598182678, "Test": {"Augmented-0.01-Quantile-Accuracy": 93.07999420166016, "Augmented-0.05-Quantile-Accuracy": 95.93000030517578, "Augmented-0.1-Quantile-Accuracy": 96.93999481201172, "Augmented-Accuracy": 98.5076, "Augmented-Loss": 0.08292599481862784, "Clean-Accuracy": 98.8, "Clean-Loss": 0.04359746083021164, "PGD-Accuracy": 10.88, "PGD-Loss": 6.855070190429688}, "Total-Time": 16655.56769132614, "Train": {"Loss": 2.741083556846336, "avg t": 1.0116474474447745, "plain loss": 0.16502378276454063, "standard loss": 0.09136258642085725}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 94.38333129882812, "Augmented-0.05-Quantile-Accuracy": 96.78333282470703, "Augmented-0.1-Quantile-Accuracy": 97.5, "Augmented-Accuracy": 98.68516666666666, "Augmented-Loss": 0.07834963382408022, "Clean-Accuracy": 98.91666666666667, "Clean-Loss": 0.055464497624275584, "PGD-Accuracy": 10.5, "PGD-Loss": 6.379461128234864}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 72, "Epoch-Time": 233.27772665023804, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.37999725341797, "Augmented-0.05-Quantile-Accuracy": 96.70999908447266, "Augmented-0.1-Quantile-Accuracy": 97.30999755859375, "Augmented-Accuracy": 98.6097, "Augmented-Loss": 0.10542916879224777, "Clean-Accuracy": 98.93, "Clean-Loss": 0.05355788044333458, "PGD-Accuracy": 14.35, "PGD-Loss": 6.2224185760498045}, "Total-Time": 16888.84541797638, "Train": {"Loss": 2.4562336899792707, "avg t": 1.009798874784399, "plain loss": 0.1614429375083357, "standard loss": 0.08798677371635481}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.58333587646484, "Augmented-0.05-Quantile-Accuracy": 97.28333282470703, "Augmented-0.1-Quantile-Accuracy": 97.83333587646484, "Augmented-Accuracy": 98.76433333333334, "Augmented-Loss": 0.09422308887680371, "Clean-Accuracy": 99.05, "Clean-Loss": 0.05422673053542773, "PGD-Accuracy": 14.2, "PGD-Loss": 5.9580891265869145}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 73, "Epoch-Time": 241.52158546447754, "Test": {"Augmented-0.01-Quantile-Accuracy": 92.54000091552734, "Augmented-0.05-Quantile-Accuracy": 95.38999938964844, "Augmented-0.1-Quantile-Accuracy": 96.43999481201172, "Augmented-Accuracy": 98.1691, "Augmented-Loss": 0.14959187116479875, "Clean-Accuracy": 98.83, "Clean-Loss": 0.07969278345108033, "PGD-Accuracy": 12.05, "PGD-Loss": 4.258106802368164}, "Total-Time": 17130.367003440857, "Train": {"Loss": 2.7214173748228285, "avg t": 1.0099644805413706, "plain loss": 0.16288270153469528, "standard loss": 0.0892875277582142}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 93.9000015258789, "Augmented-0.05-Quantile-Accuracy": 96.33333587646484, "Augmented-0.1-Quantile-Accuracy": 97.1500015258789, "Augmented-Accuracy": 98.49216666666666, "Augmented-Loss": 0.1334665672691663, "Clean-Accuracy": 98.91666666666667, "Clean-Loss": 0.0736720565110445, "PGD-Accuracy": 11.783333333333333, "PGD-Loss": 4.05118972269694}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 74, "Epoch-Time": 241.51810836791992, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.44999694824219, "Augmented-0.05-Quantile-Accuracy": 96.64999389648438, "Augmented-0.1-Quantile-Accuracy": 97.32999420166016, "Augmented-Accuracy": 98.6048, "Augmented-Loss": 0.09995964751398563, "Clean-Accuracy": 98.86, "Clean-Loss": 0.05780307768285275, "PGD-Accuracy": 12.64, "PGD-Loss": 5.092651513671875}, "Total-Time": 17371.885111808777, "Train": {"Loss": 2.2483626090155706, "avg t": 1.008829353208895, "plain loss": 0.15774582289236572, "standard loss": 0.08768521692548636}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.44999694824219, "Augmented-0.05-Quantile-Accuracy": 97.29999542236328, "Augmented-0.1-Quantile-Accuracy": 97.81666564941406, "Augmented-Accuracy": 98.80583333333334, "Augmented-Loss": 0.09413053309003512, "Clean-Accuracy": 98.95, "Clean-Loss": 0.05898477381716172, "PGD-Accuracy": 12.116666666666667, "PGD-Loss": 4.753241490681966}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 75, "Epoch-Time": 241.4472758769989, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.25, "Augmented-0.05-Quantile-Accuracy": 96.98999786376953, "Augmented-0.1-Quantile-Accuracy": 97.69999694824219, "Augmented-Accuracy": 98.7905, "Augmented-Loss": 0.07343016397202015, "Clean-Accuracy": 99.03, "Clean-Loss": 0.04282115352749825, "PGD-Accuracy": 10.89, "PGD-Loss": 6.330705606079102}, "Total-Time": 17613.332387685776, "Train": {"Loss": 2.4906102376867225, "avg t": 1.009882208082411, "plain loss": 0.15880021109051187, "standard loss": 0.08517805637729664}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.26666259765625, "Augmented-0.05-Quantile-Accuracy": 97.83333587646484, "Augmented-0.1-Quantile-Accuracy": 98.16666412353516, "Augmented-Accuracy": 98.93166666666667, "Augmented-Loss": 0.06644678180143238, "Clean-Accuracy": 98.88333333333334, "Clean-Loss": 0.04622394015888373, "PGD-Accuracy": 11.366666666666667, "PGD-Loss": 5.9401159159342445}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 76, "Epoch-Time": 205.14268970489502, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.54999542236328, "Augmented-0.05-Quantile-Accuracy": 97.18000030517578, "Augmented-0.1-Quantile-Accuracy": 97.63999938964844, "Augmented-Accuracy": 98.7118, "Augmented-Loss": 0.04932967793478444, "Clean-Accuracy": 98.9, "Clean-Loss": 0.043410085123451424, "PGD-Accuracy": 16.4, "PGD-Loss": 11.516758575439454}, "Total-Time": 17818.47507739067, "Train": {"Loss": 2.8848824869791665, "avg t": 1.0098498972433585, "plain loss": 0.1661366949964453, "standard loss": 0.08461785838352862}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.6500015258789, "Augmented-0.05-Quantile-Accuracy": 97.81666564941406, "Augmented-0.1-Quantile-Accuracy": 98.18333435058594, "Augmented-Accuracy": 98.94883333333334, "Augmented-Loss": 0.051347969994569816, "Clean-Accuracy": 99.08333333333333, "Clean-Loss": 0.053722646638130145, "PGD-Accuracy": 17.25, "PGD-Loss": 11.237845448811848}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 77, "Epoch-Time": 219.0476565361023, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.43000030517578, "Augmented-0.05-Quantile-Accuracy": 97.07999420166016, "Augmented-0.1-Quantile-Accuracy": 97.68999481201172, "Augmented-Accuracy": 98.7872, "Augmented-Loss": 0.0969877637695074, "Clean-Accuracy": 99.02, "Clean-Loss": 0.0515433733522892, "PGD-Accuracy": 15.02, "PGD-Loss": 5.898088415527344}, "Total-Time": 18037.522733926773, "Train": {"Loss": 2.169647702252423, "avg t": 1.0075519612630208, "plain loss": 0.1559738983701775, "standard loss": 0.0803248641258623}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.0999984741211, "Augmented-0.05-Quantile-Accuracy": 97.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.01666259765625, "Augmented-Accuracy": 98.85683333333333, "Augmented-Loss": 0.08680216210305691, "Clean-Accuracy": 98.91666666666667, "Clean-Loss": 0.05361111690600713, "PGD-Accuracy": 15.5, "PGD-Loss": 5.6467897313435875}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 78, "Epoch-Time": 241.52653050422668, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.70999908447266, "Augmented-0.05-Quantile-Accuracy": 97.43000030517578, "Augmented-0.1-Quantile-Accuracy": 98.0, "Augmented-Accuracy": 98.9693, "Augmented-Loss": 0.07366116275894642, "Clean-Accuracy": 99.12, "Clean-Loss": 0.0391503033131361, "PGD-Accuracy": 13.1, "PGD-Loss": 4.747134237670898}, "Total-Time": 18279.049264431, "Train": {"Loss": 2.3253880123915494, "avg t": 1.0074664095066213, "plain loss": 0.15191333509374547, "standard loss": 0.08068568083381764}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.51666259765625, "Augmented-0.05-Quantile-Accuracy": 97.86666870117188, "Augmented-0.1-Quantile-Accuracy": 98.21666717529297, "Augmented-Accuracy": 98.98166666666667, "Augmented-Loss": 0.06982064863130451, "Clean-Accuracy": 99.03333333333333, "Clean-Loss": 0.0445199177612861, "PGD-Accuracy": 12.25, "PGD-Loss": 4.63519936243693}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 79, "Epoch-Time": 241.73381662368774, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.93999481201172, "Augmented-0.05-Quantile-Accuracy": 97.39999389648438, "Augmented-0.1-Quantile-Accuracy": 97.93000030517578, "Augmented-Accuracy": 98.9603, "Augmented-Loss": 0.0757156619386673, "Clean-Accuracy": 99.13, "Clean-Loss": 0.04003235857486725, "PGD-Accuracy": 12.35, "PGD-Loss": 5.111626525878906}, "Total-Time": 18520.783081054688, "Train": {"Loss": 3.07121043032187, "avg t": 1.009191718172144, "plain loss": 0.16242337368505963, "standard loss": 0.08511898418681489}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.68333435058594, "Augmented-0.05-Quantile-Accuracy": 97.79999542236328, "Augmented-0.1-Quantile-Accuracy": 98.33333587646484, "Augmented-Accuracy": 99.0605, "Augmented-Loss": 0.07088522028381626, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.04330705163503686, "PGD-Accuracy": 12.066666666666666, "PGD-Loss": 4.852090476989746}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 80, "Epoch-Time": 241.69180822372437, "Test": {"Augmented-0.01-Quantile-Accuracy": 92.54000091552734, "Augmented-0.05-Quantile-Accuracy": 94.89999389648438, "Augmented-0.1-Quantile-Accuracy": 95.54000091552734, "Augmented-Accuracy": 97.4332, "Augmented-Loss": 0.12365253126807069, "Clean-Accuracy": 97.98, "Clean-Loss": 0.13211556807905908, "PGD-Accuracy": 4.68, "PGD-Loss": 21.988162365722655}, "Total-Time": 18762.474889278412, "Train": {"Loss": 2.068929329695525, "avg t": 1.0067900013747038, "plain loss": 0.15062636041641211, "standard loss": 0.07279922783912884}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 93.96666717529297, "Augmented-0.05-Quantile-Accuracy": 96.16666412353516, "Augmented-0.1-Quantile-Accuracy": 96.66666412353516, "Augmented-Accuracy": 97.9985, "Augmented-Loss": 0.11075806643228352, "Clean-Accuracy": 98.4, "Clean-Loss": 0.12040974016176142, "PGD-Accuracy": 4.966666666666667, "PGD-Loss": 20.814022725423175}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 81, "Epoch-Time": 232.1046543121338, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.41999816894531, "Augmented-0.05-Quantile-Accuracy": 97.58999633789062, "Augmented-0.1-Quantile-Accuracy": 97.89999389648438, "Augmented-Accuracy": 98.8421, "Augmented-Loss": 0.047360803452811844, "Clean-Accuracy": 99.08, "Clean-Loss": 0.04688817119588675, "PGD-Accuracy": 7.54, "PGD-Loss": 28.782302490234375}, "Total-Time": 18994.579543590546, "Train": {"Loss": 2.132668093716657, "avg t": 1.0069030415570295, "plain loss": 0.15192927281591637, "standard loss": 0.0720141135227901}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.9000015258789, "Augmented-0.05-Quantile-Accuracy": 98.01666259765625, "Augmented-0.1-Quantile-Accuracy": 98.48332977294922, "Augmented-Accuracy": 99.01066666666667, "Augmented-Loss": 0.05397724898114281, "Clean-Accuracy": 99.08333333333333, "Clean-Loss": 0.059474455290927535, "PGD-Accuracy": 7.75, "PGD-Loss": 28.48636092122396}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 82, "Epoch-Time": 204.57480597496033, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.94999694824219, "Augmented-0.05-Quantile-Accuracy": 96.88999938964844, "Augmented-0.1-Quantile-Accuracy": 97.50999450683594, "Augmented-Accuracy": 98.6601, "Augmented-Loss": 0.10278622711753846, "Clean-Accuracy": 99.1, "Clean-Loss": 0.050218649154901505, "PGD-Accuracy": 12.46, "PGD-Loss": 4.973392678833008}, "Total-Time": 19199.154349565506, "Train": {"Loss": 1.9742514288513748, "avg t": 1.0061716081831191, "plain loss": 0.14837483516445854, "standard loss": 0.07194611348494612}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.71666717529297, "Augmented-0.05-Quantile-Accuracy": 97.4000015258789, "Augmented-0.1-Quantile-Accuracy": 98.03333282470703, "Augmented-Accuracy": 98.86816666666667, "Augmented-Loss": 0.09306734660764535, "Clean-Accuracy": 99.06666666666666, "Clean-Loss": 0.05083331560716033, "PGD-Accuracy": 11.683333333333334, "PGD-Loss": 4.7963781127929686}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 83, "Epoch-Time": 233.35009622573853, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.44999694824219, "Augmented-0.05-Quantile-Accuracy": 96.66999816894531, "Augmented-0.1-Quantile-Accuracy": 97.36000061035156, "Augmented-Accuracy": 98.644, "Augmented-Loss": 0.08229781265377999, "Clean-Accuracy": 99.08, "Clean-Loss": 0.03760178103819489, "PGD-Accuracy": 11.65, "PGD-Loss": 5.4425723785400395}, "Total-Time": 19432.504445791245, "Train": {"Loss": 2.1017341111147845, "avg t": 1.0063554913556134, "plain loss": 0.15071600960802162, "standard loss": 0.07375598226432448}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.53333282470703, "Augmented-0.05-Quantile-Accuracy": 97.19999694824219, "Augmented-0.1-Quantile-Accuracy": 97.75, "Augmented-Accuracy": 98.79066666666667, "Augmented-Loss": 0.07781598822464546, "Clean-Accuracy": 99.06666666666666, "Clean-Loss": 0.046763745438307525, "PGD-Accuracy": 11.033333333333333, "PGD-Loss": 5.165890426635742}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 84, "Epoch-Time": 241.55972409248352, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.32999420166016, "Augmented-0.05-Quantile-Accuracy": 97.30999755859375, "Augmented-0.1-Quantile-Accuracy": 97.83999633789062, "Augmented-Accuracy": 98.8559, "Augmented-Loss": 0.0912087839000225, "Clean-Accuracy": 99.06, "Clean-Loss": 0.04520481557846069, "PGD-Accuracy": 11.99, "PGD-Loss": 5.221753756713867}, "Total-Time": 19674.064169883728, "Train": {"Loss": 1.876550100043968, "avg t": 1.0054271541171604, "plain loss": 0.14357068339277193, "standard loss": 0.06886702128789492}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.86666870117188, "Augmented-0.05-Quantile-Accuracy": 97.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.0, "Augmented-Accuracy": 98.83183333333334, "Augmented-Loss": 0.08301427287062009, "Clean-Accuracy": 99.01666666666667, "Clean-Loss": 0.04844487871726354, "PGD-Accuracy": 11.383333333333333, "PGD-Loss": 4.9978628362019855}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 85, "Epoch-Time": 241.4742352962494, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.81999969482422, "Augmented-0.05-Quantile-Accuracy": 97.39999389648438, "Augmented-0.1-Quantile-Accuracy": 97.87999725341797, "Augmented-Accuracy": 98.9438, "Augmented-Loss": 0.08718522825336457, "Clean-Accuracy": 99.15, "Clean-Loss": 0.05094661048054695, "PGD-Accuracy": 12.92, "PGD-Loss": 4.679416348266601}, "Total-Time": 19915.538405179977, "Train": {"Loss": 2.2005447733490557, "avg t": 1.0069343879311172, "plain loss": 0.15354114590044377, "standard loss": 0.07786367076138655}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.56666564941406, "Augmented-0.05-Quantile-Accuracy": 97.93333435058594, "Augmented-0.1-Quantile-Accuracy": 98.26666259765625, "Augmented-Accuracy": 99.01016666666666, "Augmented-Loss": 0.07630941855390867, "Clean-Accuracy": 99.13333333333334, "Clean-Loss": 0.04919209623585145, "PGD-Accuracy": 12.733333333333333, "PGD-Loss": 4.589171330769857}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 86, "Epoch-Time": 241.568514585495, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.39999389648438, "Augmented-0.05-Quantile-Accuracy": 97.0999984741211, "Augmented-0.1-Quantile-Accuracy": 97.62999725341797, "Augmented-Accuracy": 98.8675, "Augmented-Loss": 0.10958981792140007, "Clean-Accuracy": 99.12, "Clean-Loss": 0.04519373558163643, "PGD-Accuracy": 11.23, "PGD-Loss": 4.429459941101074}, "Total-Time": 20157.106919765472, "Train": {"Loss": 1.8851262768639458, "avg t": 1.0051709330700063, "plain loss": 0.14855072118971102, "standard loss": 0.0771101904630799}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.13333129882812, "Augmented-0.05-Quantile-Accuracy": 97.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.04999542236328, "Augmented-Accuracy": 98.829, "Augmented-Loss": 0.10304766670723756, "Clean-Accuracy": 98.96666666666667, "Clean-Loss": 0.050271629571914674, "PGD-Accuracy": 10.566666666666666, "PGD-Loss": 4.286855026245117}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 87, "Epoch-Time": 206.21854281425476, "Test": {"Augmented-0.01-Quantile-Accuracy": 83.22999572753906, "Augmented-0.05-Quantile-Accuracy": 90.48999786376953, "Augmented-0.1-Quantile-Accuracy": 92.68000030517578, "Augmented-Accuracy": 96.2293, "Augmented-Loss": 0.2294465233285427, "Clean-Accuracy": 97.78, "Clean-Loss": 0.09441468840092421, "PGD-Accuracy": 10.84, "PGD-Loss": 7.7843784362792965}, "Total-Time": 20363.325462579727, "Train": {"Loss": 3.7049131600415266, "avg t": 1.0144340986322473, "plain loss": 0.18821441749290183, "standard loss": 0.10488818152855944}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 86.04999542236328, "Augmented-0.05-Quantile-Accuracy": 92.18333435058594, "Augmented-0.1-Quantile-Accuracy": 94.04999542236328, "Augmented-Accuracy": 96.75066666666666, "Augmented-Loss": 0.19271783488353095, "Clean-Accuracy": 98.01666666666667, "Clean-Loss": 0.09064012800032893, "PGD-Accuracy": 9.8, "PGD-Loss": 7.892468139648438}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 88, "Epoch-Time": 219.9562578201294, "Test": {"Augmented-0.01-Quantile-Accuracy": 93.77999877929688, "Augmented-0.05-Quantile-Accuracy": 96.27999877929688, "Augmented-0.1-Quantile-Accuracy": 96.90999603271484, "Augmented-Accuracy": 98.3589, "Augmented-Loss": 0.1035822797755003, "Clean-Accuracy": 98.79, "Clean-Loss": 0.0558513347953558, "PGD-Accuracy": 11.56, "PGD-Loss": 6.557900131225586}, "Total-Time": 20583.281720399857, "Train": {"Loss": 2.9552559599699797, "avg t": 1.0161659176437943, "plain loss": 0.1796656339751348, "standard loss": 0.0829991122185839}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 94.88333129882812, "Augmented-0.05-Quantile-Accuracy": 96.96666717529297, "Augmented-0.1-Quantile-Accuracy": 97.58333587646484, "Augmented-Accuracy": 98.6665, "Augmented-Loss": 0.08700390126188597, "Clean-Accuracy": 99.01666666666667, "Clean-Loss": 0.049315675564110276, "PGD-Accuracy": 11.833333333333334, "PGD-Loss": 6.404838859558105}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 89, "Epoch-Time": 241.71416568756104, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.68999481201172, "Augmented-0.05-Quantile-Accuracy": 96.97999572753906, "Augmented-0.1-Quantile-Accuracy": 97.66999816894531, "Augmented-Accuracy": 98.7459, "Augmented-Loss": 0.10434510427212715, "Clean-Accuracy": 99.0, "Clean-Loss": 0.046559873580932616, "PGD-Accuracy": 11.78, "PGD-Loss": 6.479317199707031}, "Total-Time": 20824.995886087418, "Train": {"Loss": 2.6438224805902553, "avg t": 1.0119568126819751, "plain loss": 0.16830540143295597, "standard loss": 0.07893754068827602}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.8499984741211, "Augmented-0.05-Quantile-Accuracy": 97.26666259765625, "Augmented-0.1-Quantile-Accuracy": 97.69999694824219, "Augmented-Accuracy": 98.7215, "Augmented-Loss": 0.0972844860080878, "Clean-Accuracy": 99.05, "Clean-Loss": 0.04907081349814932, "PGD-Accuracy": 11.183333333333334, "PGD-Loss": 6.169444175720215}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 90, "Epoch-Time": 241.72208070755005, "Test": {"Augmented-0.01-Quantile-Accuracy": 91.98999786376953, "Augmented-0.05-Quantile-Accuracy": 95.43000030517578, "Augmented-0.1-Quantile-Accuracy": 96.6199951171875, "Augmented-Accuracy": 98.2816, "Augmented-Loss": 0.2182632686958313, "Clean-Accuracy": 99.12, "Clean-Loss": 0.07822243764400483, "PGD-Accuracy": 11.45, "PGD-Loss": 3.907163105773926}, "Total-Time": 21066.717966794968, "Train": {"Loss": 2.7598253538696853, "avg t": 1.0118839442641647, "plain loss": 0.1670892998766015, "standard loss": 0.08090568510015253}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 93.04999542236328, "Augmented-0.05-Quantile-Accuracy": 95.68333435058594, "Augmented-0.1-Quantile-Accuracy": 96.5999984741211, "Augmented-Accuracy": 98.23933333333333, "Augmented-Loss": 0.19167602577527365, "Clean-Accuracy": 98.95, "Clean-Loss": 0.07141220719615618, "PGD-Accuracy": 10.7, "PGD-Loss": 3.7739353205362955}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 91, "Epoch-Time": 241.71229076385498, "Test": {"Augmented-0.01-Quantile-Accuracy": 91.08999633789062, "Augmented-0.05-Quantile-Accuracy": 94.8499984741211, "Augmented-0.1-Quantile-Accuracy": 95.97999572753906, "Augmented-Accuracy": 98.0044, "Augmented-Loss": 0.1741301642024517, "Clean-Accuracy": 98.74, "Clean-Loss": 0.06807862872332335, "PGD-Accuracy": 10.68, "PGD-Loss": 6.924295004272461}, "Total-Time": 21308.430257558823, "Train": {"Loss": 18.506806933650264, "avg t": 1.1475016140407985, "plain loss": 0.6250768438692443, "standard loss": 0.49402469170783403}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 92.5, "Augmented-0.05-Quantile-Accuracy": 95.86666870117188, "Augmented-0.1-Quantile-Accuracy": 96.6500015258789, "Augmented-Accuracy": 98.27, "Augmented-Loss": 0.1567280821845929, "Clean-Accuracy": 98.78333333333333, "Clean-Loss": 0.06619474683205287, "PGD-Accuracy": 10.016666666666667, "PGD-Loss": 6.7691045633951825}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 92, "Epoch-Time": 230.9616882801056, "Test": {"Augmented-0.01-Quantile-Accuracy": 93.86000061035156, "Augmented-0.05-Quantile-Accuracy": 96.12999725341797, "Augmented-0.1-Quantile-Accuracy": 96.97999572753906, "Augmented-Accuracy": 98.4735, "Augmented-Loss": 0.07968118192970752, "Clean-Accuracy": 98.79, "Clean-Loss": 0.04729777151718736, "PGD-Accuracy": 10.28, "PGD-Loss": 8.591642041015625}, "Total-Time": 21539.39194583893, "Train": {"Loss": 3.949086832682292, "avg t": 1.0273657151681406, "plain loss": 0.24338224546820994, "standard loss": 0.11782049450002335}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 94.48332977294922, "Augmented-0.05-Quantile-Accuracy": 96.9000015258789, "Augmented-0.1-Quantile-Accuracy": 97.48332977294922, "Augmented-Accuracy": 98.711, "Augmented-Loss": 0.07144510919036964, "Clean-Accuracy": 98.96666666666667, "Clean-Loss": 0.04780069793667644, "PGD-Accuracy": 10.133333333333333, "PGD-Loss": 8.324676895141602}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 93, "Epoch-Time": 205.4885458946228, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.15999603271484, "Augmented-0.05-Quantile-Accuracy": 96.41999816894531, "Augmented-0.1-Quantile-Accuracy": 97.16999816894531, "Augmented-Accuracy": 98.5862, "Augmented-Loss": 0.1036052786796093, "Clean-Accuracy": 98.91, "Clean-Loss": 0.045521444128453735, "PGD-Accuracy": 10.5, "PGD-Loss": 7.84328088684082}, "Total-Time": 21744.88049173355, "Train": {"Loss": 3.443457829969901, "avg t": 1.0219033309088812, "plain loss": 0.23136511917114255, "standard loss": 0.11133332935844859}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 94.91666412353516, "Augmented-0.05-Quantile-Accuracy": 97.06666564941406, "Augmented-0.1-Quantile-Accuracy": 97.63333129882812, "Augmented-Accuracy": 98.68233333333333, "Augmented-Loss": 0.0922656672586004, "Clean-Accuracy": 98.98333333333333, "Clean-Loss": 0.0477040908181419, "PGD-Accuracy": 10.366666666666667, "PGD-Loss": 7.6501565984090165}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 94, "Epoch-Time": 234.6495258808136, "Test": {"Augmented-0.01-Quantile-Accuracy": 92.61000061035156, "Augmented-0.05-Quantile-Accuracy": 95.55999755859375, "Augmented-0.1-Quantile-Accuracy": 96.39999389648438, "Augmented-Accuracy": 98.2802, "Augmented-Loss": 0.1439152361137867, "Clean-Accuracy": 98.85, "Clean-Loss": 0.05205086427927017, "PGD-Accuracy": 11.21, "PGD-Loss": 5.371841772460938}, "Total-Time": 21979.530017614365, "Train": {"Loss": 3.4228960927680685, "avg t": 1.0209746560343989, "plain loss": 0.22912390526312362, "standard loss": 0.10767048050490795}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 93.54999542236328, "Augmented-0.05-Quantile-Accuracy": 96.31666564941406, "Augmented-0.1-Quantile-Accuracy": 97.18333435058594, "Augmented-Accuracy": 98.435, "Augmented-Loss": 0.12725499082138142, "Clean-Accuracy": 98.93333333333334, "Clean-Loss": 0.052401647473375, "PGD-Accuracy": 10.5, "PGD-Loss": 5.348289042154948}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 95, "Epoch-Time": 241.8617033958435, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.5999984741211, "Augmented-0.05-Quantile-Accuracy": 96.8699951171875, "Augmented-0.1-Quantile-Accuracy": 97.40999603271484, "Augmented-Accuracy": 98.7064, "Augmented-Loss": 0.081724245418787, "Clean-Accuracy": 98.99, "Clean-Loss": 0.042281365748494865, "PGD-Accuracy": 11.24, "PGD-Loss": 7.136027108764648}, "Total-Time": 22221.391721010208, "Train": {"Loss": 2.9343205610204626, "avg t": 1.0180041217450742, "plain loss": 0.2161586633011148, "standard loss": 0.10293092037958128}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.61666870117188, "Augmented-0.05-Quantile-Accuracy": 97.23332977294922, "Augmented-0.1-Quantile-Accuracy": 98.01666259765625, "Augmented-Accuracy": 98.85783333333333, "Augmented-Loss": 0.07419083337634802, "Clean-Accuracy": 99.03333333333333, "Clean-Loss": 0.04328183311099808, "PGD-Accuracy": 10.65, "PGD-Loss": 6.860121241251628}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 96, "Epoch-Time": 241.74103212356567, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.73999786376953, "Augmented-0.05-Quantile-Accuracy": 96.93999481201172, "Augmented-0.1-Quantile-Accuracy": 97.5199966430664, "Augmented-Accuracy": 98.7418, "Augmented-Loss": 0.08372160483324528, "Clean-Accuracy": 99.01, "Clean-Loss": 0.04363843506127596, "PGD-Accuracy": 11.02, "PGD-Loss": 6.233448336791993}, "Total-Time": 22463.132753133774, "Train": {"Loss": 2.8116112524668377, "avg t": 1.0165590986675686, "plain loss": 0.2134285815892396, "standard loss": 0.10343201603878427}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.6500015258789, "Augmented-0.05-Quantile-Accuracy": 97.29999542236328, "Augmented-0.1-Quantile-Accuracy": 97.96666717529297, "Augmented-Accuracy": 98.83933333333333, "Augmented-Loss": 0.07878389876946806, "Clean-Accuracy": 99.01666666666667, "Clean-Loss": 0.04582713415349523, "PGD-Accuracy": 10.033333333333333, "PGD-Loss": 6.043446080525716}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 97, "Epoch-Time": 241.69619584083557, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.2699966430664, "Augmented-0.05-Quantile-Accuracy": 97.12999725341797, "Augmented-0.1-Quantile-Accuracy": 97.70999908447266, "Augmented-Accuracy": 98.816, "Augmented-Loss": 0.0901081751613617, "Clean-Accuracy": 99.02, "Clean-Loss": 0.043950316049158576, "PGD-Accuracy": 10.83, "PGD-Loss": 6.104402508544922}, "Total-Time": 22704.82894897461, "Train": {"Loss": 2.742580497353165, "avg t": 1.013837696146082, "plain loss": 0.20466655328891917, "standard loss": 0.09934951447861062}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.03333282470703, "Augmented-0.05-Quantile-Accuracy": 97.61666870117188, "Augmented-0.1-Quantile-Accuracy": 98.01666259765625, "Augmented-Accuracy": 98.88083333333333, "Augmented-Loss": 0.08271357273807128, "Clean-Accuracy": 99.03333333333333, "Clean-Loss": 0.042491056176523365, "PGD-Accuracy": 10.383333333333333, "PGD-Loss": 5.9206282399495445}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 98, "Epoch-Time": 206.27611565589905, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.8699951171875, "Augmented-0.05-Quantile-Accuracy": 96.94999694824219, "Augmented-0.1-Quantile-Accuracy": 97.58999633789062, "Augmented-Accuracy": 98.7527, "Augmented-Loss": 0.13445638673830032, "Clean-Accuracy": 99.06, "Clean-Loss": 0.05275572086572647, "PGD-Accuracy": 11.33, "PGD-Loss": 4.424452268981933}, "Total-Time": 22911.10506463051, "Train": {"Loss": 2.6306030009234393, "avg t": 1.013299308847498, "plain loss": 0.20214735301159015, "standard loss": 0.10181122657960212}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.54999542236328, "Augmented-0.05-Quantile-Accuracy": 97.31666564941406, "Augmented-0.1-Quantile-Accuracy": 97.86666870117188, "Augmented-Accuracy": 98.86, "Augmented-Loss": 0.1238164825383822, "Clean-Accuracy": 99.08333333333333, "Clean-Loss": 0.051910956313212714, "PGD-Accuracy": 10.6, "PGD-Loss": 4.262501248677571}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 99, "Epoch-Time": 219.9459524154663, "Test": {"Augmented-0.01-Quantile-Accuracy": 93.22999572753906, "Augmented-0.05-Quantile-Accuracy": 96.12999725341797, "Augmented-0.1-Quantile-Accuracy": 96.91999816894531, "Augmented-Accuracy": 98.4512, "Augmented-Loss": 0.1713983748254776, "Clean-Accuracy": 98.97, "Clean-Loss": 0.0754678407073021, "PGD-Accuracy": 11.14, "PGD-Loss": 5.413471005249024}, "Total-Time": 23131.051017045975, "Train": {"Loss": 2.1865957275673193, "avg t": 1.0103751189620407, "plain loss": 0.1866306259755733, "standard loss": 0.09239561795029376}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 94.21666717529297, "Augmented-0.05-Quantile-Accuracy": 96.5, "Augmented-0.1-Quantile-Accuracy": 97.33333587646484, "Augmented-Accuracy": 98.5425, "Augmented-Loss": 0.168878791021506, "Clean-Accuracy": 98.95, "Clean-Loss": 0.07842816011110941, "PGD-Accuracy": 10.65, "PGD-Loss": 5.222349700927734}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 100, "Epoch-Time": 241.56819772720337, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.94999694824219, "Augmented-0.05-Quantile-Accuracy": 97.37999725341797, "Augmented-0.1-Quantile-Accuracy": 97.8499984741211, "Augmented-Accuracy": 98.7159, "Augmented-Loss": 0.05746013714215532, "Clean-Accuracy": 98.82, "Clean-Loss": 0.06355866695937003, "PGD-Accuracy": 7.59, "PGD-Loss": 18.532008325195314}, "Total-Time": 23372.619214773178, "Train": {"Loss": 2.220513071272108, "avg t": 1.0102276944054498, "plain loss": 0.1903826612119321, "standard loss": 0.09833580861958088}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.58333587646484, "Augmented-0.05-Quantile-Accuracy": 97.56666564941406, "Augmented-0.1-Quantile-Accuracy": 97.98332977294922, "Augmented-Accuracy": 98.80916666666667, "Augmented-Loss": 0.06313999534341778, "Clean-Accuracy": 99.03333333333333, "Clean-Loss": 0.0699478328456753, "PGD-Accuracy": 7.633333333333334, "PGD-Loss": 18.02033359781901}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 101, "Epoch-Time": 241.7466983795166, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.48999786376953, "Augmented-0.05-Quantile-Accuracy": 96.81999969482422, "Augmented-0.1-Quantile-Accuracy": 97.43999481201172, "Augmented-Accuracy": 98.6636, "Augmented-Loss": 0.157654347281456, "Clean-Accuracy": 99.03, "Clean-Loss": 0.06481270633935929, "PGD-Accuracy": 11.34, "PGD-Loss": 3.9580241790771487}, "Total-Time": 23614.365913152695, "Train": {"Loss": 2.687682004010236, "avg t": 1.0121252637086091, "plain loss": 0.19265752056439692, "standard loss": 0.09845955031034019}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.54999542236328, "Augmented-0.05-Quantile-Accuracy": 97.38333129882812, "Augmented-0.1-Quantile-Accuracy": 97.81666564941406, "Augmented-Accuracy": 98.7795, "Augmented-Loss": 0.1454128714509805, "Clean-Accuracy": 99.05, "Clean-Loss": 0.0624879713455836, "PGD-Accuracy": 10.516666666666667, "PGD-Loss": 3.7764352595011395}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 102, "Epoch-Time": 241.55652785301208, "Test": {"Augmented-0.01-Quantile-Accuracy": 92.75, "Augmented-0.05-Quantile-Accuracy": 95.5199966430664, "Augmented-0.1-Quantile-Accuracy": 96.6199951171875, "Augmented-Accuracy": 98.2645, "Augmented-Loss": 0.21662319050884246, "Clean-Accuracy": 99.04, "Clean-Loss": 0.07283332179784775, "PGD-Accuracy": 11.21, "PGD-Loss": 3.7428963317871093}, "Total-Time": 23855.922441005707, "Train": {"Loss": 2.1760051278714783, "avg t": 1.0095652714128847, "plain loss": 0.183963356480775, "standard loss": 0.09712156599042593}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 94.0, "Augmented-0.05-Quantile-Accuracy": 96.4000015258789, "Augmented-0.1-Quantile-Accuracy": 97.18333435058594, "Augmented-Accuracy": 98.40616666666666, "Augmented-Loss": 0.19741801003893217, "Clean-Accuracy": 98.85, "Clean-Loss": 0.06974921296040217, "PGD-Accuracy": 10.4, "PGD-Loss": 3.720153615315755}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 103, "Epoch-Time": 229.7169930934906, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.63999938964844, "Augmented-0.05-Quantile-Accuracy": 97.22000122070312, "Augmented-0.1-Quantile-Accuracy": 97.79000091552734, "Augmented-Accuracy": 98.8072, "Augmented-Loss": 0.1178949767203331, "Clean-Accuracy": 99.16, "Clean-Loss": 0.04847232591807842, "PGD-Accuracy": 11.8, "PGD-Loss": 4.476217184448243}, "Total-Time": 24085.639434099197, "Train": {"Loss": 2.4514073546021073, "avg t": 1.0109643358654445, "plain loss": 0.18519386502018673, "standard loss": 0.09619426163927548}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.88333129882812, "Augmented-0.05-Quantile-Accuracy": 97.6500015258789, "Augmented-0.1-Quantile-Accuracy": 97.94999694824219, "Augmented-Accuracy": 98.84933333333333, "Augmented-Loss": 0.1101098777492841, "Clean-Accuracy": 99.03333333333333, "Clean-Loss": 0.051163978869716326, "PGD-Accuracy": 11.333333333333334, "PGD-Loss": 4.4007494799296065}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 104, "Epoch-Time": 207.32973742485046, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.02999877929688, "Augmented-0.05-Quantile-Accuracy": 96.86000061035156, "Augmented-0.1-Quantile-Accuracy": 97.47000122070312, "Augmented-Accuracy": 98.5791, "Augmented-Loss": 0.07985262634438277, "Clean-Accuracy": 98.89, "Clean-Loss": 0.046492548312991856, "PGD-Accuracy": 10.78, "PGD-Loss": 5.375636740112305}, "Total-Time": 24292.969171524048, "Train": {"Loss": 2.1400966157559997, "avg t": 1.008867065359045, "plain loss": 0.18080989098195688, "standard loss": 0.09168581525926237}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.79999542236328, "Augmented-0.05-Quantile-Accuracy": 97.33333587646484, "Augmented-0.1-Quantile-Accuracy": 97.83333587646484, "Augmented-Accuracy": 98.8095, "Augmented-Loss": 0.07845915670722722, "Clean-Accuracy": 99.1, "Clean-Loss": 0.04777028899267316, "PGD-Accuracy": 10.033333333333333, "PGD-Loss": 5.232632853190104}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 105, "Epoch-Time": 235.95058488845825, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.88999938964844, "Augmented-0.05-Quantile-Accuracy": 97.40999603271484, "Augmented-0.1-Quantile-Accuracy": 97.87999725341797, "Augmented-Accuracy": 98.8365, "Augmented-Loss": 0.051020951549291614, "Clean-Accuracy": 98.92, "Clean-Loss": 0.0398242923989892, "PGD-Accuracy": 9.18, "PGD-Loss": 8.270811322021485}, "Total-Time": 24528.919756412506, "Train": {"Loss": 2.106035164161965, "avg t": 1.0088763247595893, "plain loss": 0.1781293187106098, "standard loss": 0.09617342654863993}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.73332977294922, "Augmented-0.05-Quantile-Accuracy": 97.9000015258789, "Augmented-0.1-Quantile-Accuracy": 98.26666259765625, "Augmented-Accuracy": 99.06783333333334, "Augmented-Loss": 0.04774204376836618, "Clean-Accuracy": 99.2, "Clean-Loss": 0.03644152772054076, "PGD-Accuracy": 9.0, "PGD-Loss": 7.883631306966146}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 106, "Epoch-Time": 241.72534346580505, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.5999984741211, "Augmented-0.05-Quantile-Accuracy": 97.62999725341797, "Augmented-0.1-Quantile-Accuracy": 98.07999420166016, "Augmented-Accuracy": 98.9439, "Augmented-Loss": 0.053335945639878514, "Clean-Accuracy": 99.1, "Clean-Loss": 0.03821401824578643, "PGD-Accuracy": 14.25, "PGD-Loss": 5.905933862304687}, "Total-Time": 24770.64509987831, "Train": {"Loss": 2.3966392738201, "avg t": 1.0110272216796874, "plain loss": 0.19060828276386943, "standard loss": 0.09992580551874858}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.23332977294922, "Augmented-0.05-Quantile-Accuracy": 98.01666259765625, "Augmented-0.1-Quantile-Accuracy": 98.36666870117188, "Augmented-Accuracy": 99.02733333333333, "Augmented-Loss": 0.05175634568770727, "Clean-Accuracy": 99.15, "Clean-Loss": 0.039101934605588515, "PGD-Accuracy": 14.533333333333333, "PGD-Loss": 5.532577084859212}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 107, "Epoch-Time": 241.63150334358215, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.93000030517578, "Augmented-0.05-Quantile-Accuracy": 96.94999694824219, "Augmented-0.1-Quantile-Accuracy": 97.69999694824219, "Augmented-Accuracy": 98.7227, "Augmented-Loss": 0.13015313514852525, "Clean-Accuracy": 99.1, "Clean-Loss": 0.05796137476563454, "PGD-Accuracy": 11.1, "PGD-Loss": 3.828159559631348}, "Total-Time": 25012.276603221893, "Train": {"Loss": 2.263254851023356, "avg t": 1.0098862109007658, "plain loss": 0.18301709870585675, "standard loss": 0.09625128365942726}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.01666259765625, "Augmented-0.05-Quantile-Accuracy": 97.5, "Augmented-0.1-Quantile-Accuracy": 98.03333282470703, "Augmented-Accuracy": 98.9015, "Augmented-Loss": 0.11607561704476674, "Clean-Accuracy": 99.11666666666666, "Clean-Loss": 0.05261375865340233, "PGD-Accuracy": 10.233333333333333, "PGD-Loss": 3.6775787099202475}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 108, "Epoch-Time": 241.7516016960144, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.30999755859375, "Augmented-0.05-Quantile-Accuracy": 97.18000030517578, "Augmented-0.1-Quantile-Accuracy": 97.66999816894531, "Augmented-Accuracy": 98.6709, "Augmented-Loss": 0.13448548770523072, "Clean-Accuracy": 98.73, "Clean-Loss": 0.08706883620023727, "PGD-Accuracy": 12.17, "PGD-Loss": 6.6028455596923825}, "Total-Time": 25254.028204917908, "Train": {"Loss": 2.222848346427635, "avg t": 1.0097765948684128, "plain loss": 0.18246219453988263, "standard loss": 0.09916241676056826}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.71666717529297, "Augmented-0.05-Quantile-Accuracy": 97.46666717529297, "Augmented-0.1-Quantile-Accuracy": 97.88333129882812, "Augmented-Accuracy": 98.67683333333333, "Augmented-Loss": 0.12792172357877096, "Clean-Accuracy": 98.76666666666667, "Clean-Loss": 0.08360829042394956, "PGD-Accuracy": 12.416666666666666, "PGD-Loss": 6.359971084594727}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 109, "Epoch-Time": 207.13103342056274, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.40999603271484, "Augmented-0.05-Quantile-Accuracy": 97.22999572753906, "Augmented-0.1-Quantile-Accuracy": 97.81999969482422, "Augmented-Accuracy": 98.7686, "Augmented-Loss": 0.08743430507528782, "Clean-Accuracy": 98.9, "Clean-Loss": 0.05093221673965454, "PGD-Accuracy": 11.15, "PGD-Loss": 5.126998089599609}, "Total-Time": 25461.15923833847, "Train": {"Loss": 2.083052118442677, "avg t": 1.0087338188665884, "plain loss": 0.1780434434784784, "standard loss": 0.0977918929187236}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.25, "Augmented-0.05-Quantile-Accuracy": 97.63333129882812, "Augmented-0.1-Quantile-Accuracy": 98.04999542236328, "Augmented-Accuracy": 98.88033333333334, "Augmented-Loss": 0.08145618139108023, "Clean-Accuracy": 99.01666666666667, "Clean-Loss": 0.04785129941006502, "PGD-Accuracy": 10.416666666666666, "PGD-Loss": 4.934478640238444}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 110, "Epoch-Time": 219.77636790275574, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.55999755859375, "Augmented-0.05-Quantile-Accuracy": 96.8699951171875, "Augmented-0.1-Quantile-Accuracy": 97.62999725341797, "Augmented-Accuracy": 98.748, "Augmented-Loss": 0.1858434450173378, "Clean-Accuracy": 99.14, "Clean-Loss": 0.08999682323932648, "PGD-Accuracy": 11.4, "PGD-Loss": 3.396858332824707}, "Total-Time": 25680.935606241226, "Train": {"Loss": 2.0990201345726294, "avg t": 1.0082219554759837, "plain loss": 0.1825284530286437, "standard loss": 0.10219636012006689}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.66666412353516, "Augmented-0.05-Quantile-Accuracy": 97.38333129882812, "Augmented-0.1-Quantile-Accuracy": 97.76666259765625, "Augmented-Accuracy": 98.788, "Augmented-Loss": 0.17023330302119255, "Clean-Accuracy": 99.1, "Clean-Loss": 0.08345694567759832, "PGD-Accuracy": 10.733333333333333, "PGD-Loss": 3.314337520599365}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 111, "Epoch-Time": 241.5081377029419, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.75, "Augmented-0.05-Quantile-Accuracy": 96.97000122070312, "Augmented-0.1-Quantile-Accuracy": 97.65999603271484, "Augmented-Accuracy": 98.6902, "Augmented-Loss": 0.15261262669038772, "Clean-Accuracy": 99.04, "Clean-Loss": 0.08349947032928466, "PGD-Accuracy": 12.63, "PGD-Loss": 4.19042321472168}, "Total-Time": 25922.443743944168, "Train": {"Loss": 2.315834220674303, "avg t": 1.0094498200946385, "plain loss": 0.18372232289490878, "standard loss": 0.1044331786442134}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.5, "Augmented-0.05-Quantile-Accuracy": 97.51666259765625, "Augmented-0.1-Quantile-Accuracy": 97.96666717529297, "Augmented-Accuracy": 98.83783333333334, "Augmented-Loss": 0.13826237225472926, "Clean-Accuracy": 99.06666666666666, "Clean-Loss": 0.07793315492073695, "PGD-Accuracy": 11.783333333333333, "PGD-Loss": 4.066383814493815}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 112, "Epoch-Time": 241.527174949646, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.72000122070312, "Augmented-0.05-Quantile-Accuracy": 97.41999816894531, "Augmented-0.1-Quantile-Accuracy": 97.87999725341797, "Augmented-Accuracy": 98.9212, "Augmented-Loss": 0.09186487688064575, "Clean-Accuracy": 99.12, "Clean-Loss": 0.046569947397708894, "PGD-Accuracy": 12.27, "PGD-Loss": 4.896184527587891}, "Total-Time": 26163.970918893814, "Train": {"Loss": 2.039137894100613, "avg t": 1.0080063883463541, "plain loss": 0.17830399752722853, "standard loss": 0.10160049854301743}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.48332977294922, "Augmented-0.05-Quantile-Accuracy": 97.78333282470703, "Augmented-0.1-Quantile-Accuracy": 98.13333129882812, "Augmented-Accuracy": 98.9735, "Augmented-Loss": 0.08642831304132938, "Clean-Accuracy": 99.15, "Clean-Loss": 0.04910845806698005, "PGD-Accuracy": 11.966666666666667, "PGD-Loss": 4.6788398564656575}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 113, "Epoch-Time": 241.50601387023926, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.91999816894531, "Augmented-0.05-Quantile-Accuracy": 97.47000122070312, "Augmented-0.1-Quantile-Accuracy": 97.98999786376953, "Augmented-Accuracy": 98.8848, "Augmented-Loss": 0.08329491545283794, "Clean-Accuracy": 99.02, "Clean-Loss": 0.05282358811497688, "PGD-Accuracy": 14.55, "PGD-Loss": 5.303007049560547}, "Total-Time": 26405.476932764053, "Train": {"Loss": 2.4563627956531664, "avg t": 1.0089220904950742, "plain loss": 0.18549898244363303, "standard loss": 0.10255247086590087}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.88333129882812, "Augmented-0.05-Quantile-Accuracy": 97.94999694824219, "Augmented-0.1-Quantile-Accuracy": 98.3499984741211, "Augmented-Accuracy": 98.9605, "Augmented-Loss": 0.07614510436922312, "Clean-Accuracy": 99.01666666666667, "Clean-Loss": 0.05220343279341857, "PGD-Accuracy": 15.0, "PGD-Loss": 5.014174728393555}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 114, "Epoch-Time": 226.79576468467712, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.5, "Augmented-0.05-Quantile-Accuracy": 97.07999420166016, "Augmented-0.1-Quantile-Accuracy": 97.52999877929688, "Augmented-Accuracy": 98.6078, "Augmented-Loss": 0.05578250393052399, "Clean-Accuracy": 98.81, "Clean-Loss": 0.05404440057612955, "PGD-Accuracy": 11.15, "PGD-Loss": 17.84282498779297}, "Total-Time": 26632.27269744873, "Train": {"Loss": 1.9919852902447737, "avg t": 1.00667286212356, "plain loss": 0.1805464545797421, "standard loss": 0.10175217732676753}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.1500015258789, "Augmented-0.05-Quantile-Accuracy": 97.44999694824219, "Augmented-0.1-Quantile-Accuracy": 97.94999694824219, "Augmented-Accuracy": 98.79283333333333, "Augmented-Loss": 0.057632027411212525, "Clean-Accuracy": 98.9, "Clean-Loss": 0.055052915849722925, "PGD-Accuracy": 11.85, "PGD-Loss": 17.517249399820965}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 115, "Epoch-Time": 208.41919136047363, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.81999969482422, "Augmented-0.05-Quantile-Accuracy": 96.57999420166016, "Augmented-0.1-Quantile-Accuracy": 97.30999755859375, "Augmented-Accuracy": 98.5157, "Augmented-Loss": 0.13984526719236373, "Clean-Accuracy": 99.03, "Clean-Loss": 0.07496317150592804, "PGD-Accuracy": 14.91, "PGD-Loss": 4.112003984069824}, "Total-Time": 26840.691888809204, "Train": {"Loss": 1.8867725817362468, "avg t": 1.0066491351657443, "plain loss": 0.17731965051050536, "standard loss": 0.09903769835691761}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.01666259765625, "Augmented-0.05-Quantile-Accuracy": 97.31666564941406, "Augmented-0.1-Quantile-Accuracy": 97.81666564941406, "Augmented-Accuracy": 98.7575, "Augmented-Loss": 0.12304850812832514, "Clean-Accuracy": 99.16666666666667, "Clean-Loss": 0.06707116178671518, "PGD-Accuracy": 14.133333333333333, "PGD-Loss": 3.918566942850749}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 116, "Epoch-Time": 237.4935483932495, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.7699966430664, "Augmented-0.05-Quantile-Accuracy": 97.36000061035156, "Augmented-0.1-Quantile-Accuracy": 97.90999603271484, "Augmented-Accuracy": 98.8629, "Augmented-Loss": 0.11163937363028527, "Clean-Accuracy": 99.05, "Clean-Loss": 0.05519697118997574, "PGD-Accuracy": 11.14, "PGD-Loss": 4.2496893585205076}, "Total-Time": 27078.185437202454, "Train": {"Loss": 2.100012581012867, "avg t": 1.0073393358301233, "plain loss": 0.18377494877179468, "standard loss": 0.09992716771557375}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.69999694824219, "Augmented-0.05-Quantile-Accuracy": 98.0, "Augmented-0.1-Quantile-Accuracy": 98.25, "Augmented-Accuracy": 99.01266666666666, "Augmented-Loss": 0.10133717668930689, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.05154591153065364, "PGD-Accuracy": 10.65, "PGD-Loss": 4.0150351816813155}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 117, "Epoch-Time": 241.6179232597351, "Test": {"Augmented-0.01-Quantile-Accuracy": 73.95999908447266, "Augmented-0.05-Quantile-Accuracy": 83.16999816894531, "Augmented-0.1-Quantile-Accuracy": 86.30999755859375, "Augmented-Accuracy": 92.8268, "Augmented-Loss": 0.7241281851997375, "Clean-Accuracy": 98.08, "Clean-Loss": 0.3398467451095581, "PGD-Accuracy": 11.13, "PGD-Loss": 2.6725618392944335}, "Total-Time": 27319.80336046219, "Train": {"Loss": 1.87327443935253, "avg t": 1.0066965889047694, "plain loss": 0.17183488515218112, "standard loss": 0.08712412372272875}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 77.91666412353516, "Augmented-0.05-Quantile-Accuracy": 85.83333587646484, "Augmented-0.1-Quantile-Accuracy": 88.5999984741211, "Augmented-Accuracy": 94.00966666666666, "Augmented-Loss": 0.6821667326800028, "Clean-Accuracy": 97.93333333333334, "Clean-Loss": 0.31564720010757447, "PGD-Accuracy": 10.35, "PGD-Loss": 2.6864720408121743}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 118, "Epoch-Time": 241.50306963920593, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.0, "Augmented-0.05-Quantile-Accuracy": 97.55999755859375, "Augmented-0.1-Quantile-Accuracy": 97.97000122070312, "Augmented-Accuracy": 98.9002, "Augmented-Loss": 0.08955678001189232, "Clean-Accuracy": 99.04, "Clean-Loss": 0.05058519114851952, "PGD-Accuracy": 11.23, "PGD-Loss": 5.922336950683594}, "Total-Time": 27561.306430101395, "Train": {"Loss": 1.756683578491211, "avg t": 1.005521868635107, "plain loss": 0.17665789462548714, "standard loss": 0.09312018707670547}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.68333435058594, "Augmented-0.05-Quantile-Accuracy": 97.91666412353516, "Augmented-0.1-Quantile-Accuracy": 98.28333282470703, "Augmented-Accuracy": 98.98316666666666, "Augmented-Loss": 0.08659579611579576, "Clean-Accuracy": 99.03333333333333, "Clean-Loss": 0.049805765464901924, "PGD-Accuracy": 10.5, "PGD-Loss": 5.542658688863119}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 119, "Epoch-Time": 241.7198088169098, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.47000122070312, "Augmented-0.05-Quantile-Accuracy": 97.81999969482422, "Augmented-0.1-Quantile-Accuracy": 98.22999572753906, "Augmented-Accuracy": 99.0446, "Augmented-Loss": 0.08042727255368233, "Clean-Accuracy": 99.15, "Clean-Loss": 0.04167683392763138, "PGD-Accuracy": 10.64, "PGD-Loss": 4.926124423217773}, "Total-Time": 27803.026238918304, "Train": {"Loss": 1.8080970769458347, "avg t": 1.0057384967803955, "plain loss": 0.17574318626191882, "standard loss": 0.09443204288791728}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.0, "Augmented-0.05-Quantile-Accuracy": 98.25, "Augmented-0.1-Quantile-Accuracy": 98.46666717529297, "Augmented-Accuracy": 99.09333333333333, "Augmented-Loss": 0.07420136520008246, "Clean-Accuracy": 99.15, "Clean-Loss": 0.041673995221654575, "PGD-Accuracy": 10.066666666666666, "PGD-Loss": 4.627403978983561}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 120, "Epoch-Time": 205.28772044181824, "Test": {"Augmented-0.01-Quantile-Accuracy": 89.83999633789062, "Augmented-0.05-Quantile-Accuracy": 93.97000122070312, "Augmented-0.1-Quantile-Accuracy": 95.22999572753906, "Augmented-Accuracy": 97.5867, "Augmented-Loss": 0.3775500866250992, "Clean-Accuracy": 98.81, "Clean-Loss": 0.17021254081726075, "PGD-Accuracy": 10.98, "PGD-Loss": 3.2602534133911134}, "Total-Time": 28008.313959360123, "Train": {"Loss": 2.204699541586417, "avg t": 1.0072545075946384, "plain loss": 0.17823287008426794, "standard loss": 0.0913639823777808}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 92.16666412353516, "Augmented-0.05-Quantile-Accuracy": 95.38333129882812, "Augmented-0.1-Quantile-Accuracy": 96.25, "Augmented-Accuracy": 98.00433333333334, "Augmented-Loss": 0.33902530517101287, "Clean-Accuracy": 99.0, "Clean-Loss": 0.1473805976311366, "PGD-Accuracy": 10.45, "PGD-Loss": 3.1069121182759605}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 121, "Epoch-Time": 220.88446688652039, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.29000091552734, "Augmented-0.05-Quantile-Accuracy": 97.68999481201172, "Augmented-0.1-Quantile-Accuracy": 98.2699966430664, "Augmented-Accuracy": 99.018, "Augmented-Loss": 0.09087080250716209, "Clean-Accuracy": 99.2, "Clean-Loss": 0.04564313336312771, "PGD-Accuracy": 11.73, "PGD-Loss": 4.841001196289063}, "Total-Time": 28229.198426246643, "Train": {"Loss": 1.8048035810611867, "avg t": 1.0058584330876668, "plain loss": 0.17733862018585214, "standard loss": 0.0903002250045538}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.93333435058594, "Augmented-0.05-Quantile-Accuracy": 97.81666564941406, "Augmented-0.1-Quantile-Accuracy": 98.19999694824219, "Augmented-Accuracy": 98.95916666666666, "Augmented-Loss": 0.08773568090726933, "Clean-Accuracy": 99.11666666666666, "Clean-Loss": 0.048702835738658905, "PGD-Accuracy": 11.133333333333333, "PGD-Loss": 4.663554328918457}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 122, "Epoch-Time": 241.28684401512146, "Test": {"Augmented-0.01-Quantile-Accuracy": 93.48999786376953, "Augmented-0.05-Quantile-Accuracy": 95.91999816894531, "Augmented-0.1-Quantile-Accuracy": 96.64999389648438, "Augmented-Accuracy": 98.3282, "Augmented-Loss": 0.22939989859962465, "Clean-Accuracy": 98.82, "Clean-Loss": 0.11013598086833953, "PGD-Accuracy": 11.25, "PGD-Loss": 3.701113781738281}, "Total-Time": 28470.485270261765, "Train": {"Loss": 1.784122050885801, "avg t": 1.0051989037019236, "plain loss": 0.1769197292398523, "standard loss": 0.09046168738272455}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 94.43333435058594, "Augmented-0.05-Quantile-Accuracy": 96.66666412353516, "Augmented-0.1-Quantile-Accuracy": 97.5, "Augmented-Accuracy": 98.61566666666667, "Augmented-Loss": 0.20343816145737967, "Clean-Accuracy": 99.0, "Clean-Loss": 0.09658273496230443, "PGD-Accuracy": 10.516666666666667, "PGD-Loss": 3.6705815099080406}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 123, "Epoch-Time": 241.60085701942444, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.48999786376953, "Augmented-0.05-Quantile-Accuracy": 97.66999816894531, "Augmented-0.1-Quantile-Accuracy": 98.08999633789062, "Augmented-Accuracy": 98.9941, "Augmented-Loss": 0.08111785462987423, "Clean-Accuracy": 99.07, "Clean-Loss": 0.04362656479179859, "PGD-Accuracy": 13.13, "PGD-Loss": 5.004498425292969}, "Total-Time": 28712.08612728119, "Train": {"Loss": 1.709321796876413, "avg t": 1.0048795075769779, "plain loss": 0.17594204815405376, "standard loss": 0.09083730938037236}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.0999984741211, "Augmented-0.05-Quantile-Accuracy": 98.0999984741211, "Augmented-0.1-Quantile-Accuracy": 98.41666412353516, "Augmented-Accuracy": 99.019, "Augmented-Loss": 0.07394431129276753, "Clean-Accuracy": 99.1, "Clean-Loss": 0.04095498838524024, "PGD-Accuracy": 13.016666666666667, "PGD-Loss": 4.826111147562663}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 124, "Epoch-Time": 241.43789267539978, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.16999816894531, "Augmented-0.05-Quantile-Accuracy": 96.97999572753906, "Augmented-0.1-Quantile-Accuracy": 97.50999450683594, "Augmented-Accuracy": 98.7287, "Augmented-Loss": 0.15670338499403, "Clean-Accuracy": 98.9, "Clean-Loss": 0.08334974277019501, "PGD-Accuracy": 11.03, "PGD-Loss": 5.199392736816407}, "Total-Time": 28953.52401995659, "Train": {"Loss": 2.102937679114165, "avg t": 1.0077392684088813, "plain loss": 0.17862657732963555, "standard loss": 0.09464939995268705}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.08333587646484, "Augmented-0.05-Quantile-Accuracy": 97.53333282470703, "Augmented-0.1-Quantile-Accuracy": 98.06666564941406, "Augmented-Accuracy": 98.887, "Augmented-Loss": 0.1356315035390854, "Clean-Accuracy": 99.05, "Clean-Loss": 0.07372370298703512, "PGD-Accuracy": 10.6, "PGD-Loss": 5.114738929748535}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 125, "Epoch-Time": 223.35169649124146, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.36000061035156, "Augmented-0.05-Quantile-Accuracy": 97.18999481201172, "Augmented-0.1-Quantile-Accuracy": 97.91999816894531, "Augmented-Accuracy": 98.8575, "Augmented-Loss": 0.16224308034467697, "Clean-Accuracy": 99.16, "Clean-Loss": 0.06981878821849823, "PGD-Accuracy": 11.05, "PGD-Loss": 4.225886544799804}, "Total-Time": 29176.87571644783, "Train": {"Loss": 2.136505469498811, "avg t": 1.0080128505141648, "plain loss": 0.18061687237068447, "standard loss": 0.09345169741632761}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.03333282470703, "Augmented-0.05-Quantile-Accuracy": 97.54999542236328, "Augmented-0.1-Quantile-Accuracy": 97.9000015258789, "Augmented-Accuracy": 98.85333333333334, "Augmented-Loss": 0.14806841831008594, "Clean-Accuracy": 99.05, "Clean-Loss": 0.0672325499455134, "PGD-Accuracy": 10.45, "PGD-Loss": 4.136097244262695}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 126, "Epoch-Time": 208.6057891845703, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.43999481201172, "Augmented-0.05-Quantile-Accuracy": 96.63999938964844, "Augmented-0.1-Quantile-Accuracy": 97.39999389648438, "Augmented-Accuracy": 98.7712, "Augmented-Loss": 0.2158855180950165, "Clean-Accuracy": 99.06, "Clean-Loss": 0.10482716131210328, "PGD-Accuracy": 10.89, "PGD-Loss": 3.9525552215576174}, "Total-Time": 29385.4815056324, "Train": {"Loss": 2.055014211901912, "avg t": 1.0068638826299596, "plain loss": 0.17411308835700715, "standard loss": 0.08825121870305803}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.18333435058594, "Augmented-0.05-Quantile-Accuracy": 97.18333435058594, "Augmented-0.1-Quantile-Accuracy": 97.8499984741211, "Augmented-Accuracy": 98.76066666666667, "Augmented-Loss": 0.2001974359850089, "Clean-Accuracy": 99.03333333333333, "Clean-Loss": 0.10032407283782958, "PGD-Accuracy": 10.1, "PGD-Loss": 3.8018064931233724}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 127, "Epoch-Time": 238.20330715179443, "Test": {"Augmented-0.01-Quantile-Accuracy": 92.66999816894531, "Augmented-0.05-Quantile-Accuracy": 95.5, "Augmented-0.1-Quantile-Accuracy": 96.54999542236328, "Augmented-Accuracy": 98.1841, "Augmented-Loss": 0.20523630154800415, "Clean-Accuracy": 98.86, "Clean-Loss": 0.0709181429862976, "PGD-Accuracy": 10.95, "PGD-Loss": 3.6257290710449217}, "Total-Time": 29623.684812784195, "Train": {"Loss": 1.862665972744977, "avg t": 1.0058429045147366, "plain loss": 0.17557279372745074, "standard loss": 0.08943011889855067}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 93.71666717529297, "Augmented-0.05-Quantile-Accuracy": 96.26666259765625, "Augmented-0.1-Quantile-Accuracy": 96.96666717529297, "Augmented-Accuracy": 98.248, "Augmented-Loss": 0.18401765907645226, "Clean-Accuracy": 98.88333333333334, "Clean-Loss": 0.06464551094174385, "PGD-Accuracy": 10.266666666666667, "PGD-Loss": 3.5140534922281903}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 128, "Epoch-Time": 241.28257250785828, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.07999420166016, "Augmented-0.05-Quantile-Accuracy": 97.6199951171875, "Augmented-0.1-Quantile-Accuracy": 98.0199966430664, "Augmented-Accuracy": 98.9448, "Augmented-Loss": 0.06608114115989208, "Clean-Accuracy": 99.11, "Clean-Loss": 0.03918183629363775, "PGD-Accuracy": 11.71, "PGD-Loss": 5.271064263916015}, "Total-Time": 29864.967385292053, "Train": {"Loss": 1.9793616238346807, "avg t": 1.006758462022852, "plain loss": 0.17414436820877946, "standard loss": 0.08743992211807657}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.81666564941406, "Augmented-0.05-Quantile-Accuracy": 97.94999694824219, "Augmented-0.1-Quantile-Accuracy": 98.29999542236328, "Augmented-Accuracy": 98.99366666666667, "Augmented-Loss": 0.05944802629406253, "Clean-Accuracy": 99.08333333333333, "Clean-Loss": 0.037917854669193424, "PGD-Accuracy": 11.683333333333334, "PGD-Loss": 5.065583521525065}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 129, "Epoch-Time": 241.45537900924683, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.1199951171875, "Augmented-0.05-Quantile-Accuracy": 97.47999572753906, "Augmented-0.1-Quantile-Accuracy": 97.98999786376953, "Augmented-Accuracy": 98.9367, "Augmented-Loss": 0.1177664702887535, "Clean-Accuracy": 99.12, "Clean-Loss": 0.06232575296163559, "PGD-Accuracy": 15.97, "PGD-Loss": 4.12170601348877}, "Total-Time": 30106.4227643013, "Train": {"Loss": 2.3443708775838217, "avg t": 1.0081641332838271, "plain loss": 0.18021039393213054, "standard loss": 0.09403595775917724}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.71666717529297, "Augmented-0.05-Quantile-Accuracy": 97.79999542236328, "Augmented-0.1-Quantile-Accuracy": 98.25, "Augmented-Accuracy": 98.99966666666667, "Augmented-Loss": 0.10879306617339451, "Clean-Accuracy": 99.1, "Clean-Loss": 0.059611726740996046, "PGD-Accuracy": 14.85, "PGD-Loss": 3.914872797648112}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 130, "Epoch-Time": 241.36563634872437, "Test": {"Augmented-0.01-Quantile-Accuracy": 93.64999389648438, "Augmented-0.05-Quantile-Accuracy": 96.40999603271484, "Augmented-0.1-Quantile-Accuracy": 97.12999725341797, "Augmented-Accuracy": 98.4637, "Augmented-Loss": 0.22640321803092955, "Clean-Accuracy": 98.95, "Clean-Loss": 0.09581250863075257, "PGD-Accuracy": 11.18, "PGD-Loss": 3.4505315338134768}, "Total-Time": 30347.788400650024, "Train": {"Loss": 2.437105706144262, "avg t": 1.0075930974041973, "plain loss": 0.18329294771441695, "standard loss": 0.093127571667786}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.16666412353516, "Augmented-0.05-Quantile-Accuracy": 97.18333435058594, "Augmented-0.1-Quantile-Accuracy": 97.5999984741211, "Augmented-Accuracy": 98.59283333333333, "Augmented-Loss": 0.20627763775110244, "Clean-Accuracy": 98.9, "Clean-Loss": 0.0876117415825526, "PGD-Accuracy": 10.6, "PGD-Loss": 3.3028784879048665}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 131, "Epoch-Time": 206.7435326576233, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.95999908447266, "Augmented-0.05-Quantile-Accuracy": 97.0, "Augmented-0.1-Quantile-Accuracy": 97.62999725341797, "Augmented-Accuracy": 98.7719, "Augmented-Loss": 0.17195338591098785, "Clean-Accuracy": 99.1, "Clean-Loss": 0.0785657870054245, "PGD-Accuracy": 11.28, "PGD-Loss": 3.5951544158935547}, "Total-Time": 30554.531933307648, "Train": {"Loss": 1.7579041712725605, "avg t": 1.005078292246218, "plain loss": 0.17334265845440064, "standard loss": 0.08533281540870666}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.11666870117188, "Augmented-0.05-Quantile-Accuracy": 97.81666564941406, "Augmented-0.1-Quantile-Accuracy": 98.1500015258789, "Augmented-Accuracy": 98.8695, "Augmented-Loss": 0.14745695350289345, "Clean-Accuracy": 99.08333333333333, "Clean-Loss": 0.06771375954151154, "PGD-Accuracy": 10.866666666666667, "PGD-Loss": 3.4487102762858073}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 132, "Epoch-Time": 222.02688217163086, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.55999755859375, "Augmented-0.05-Quantile-Accuracy": 97.22999572753906, "Augmented-0.1-Quantile-Accuracy": 97.72999572753906, "Augmented-Accuracy": 98.7519, "Augmented-Loss": 0.09940512537646294, "Clean-Accuracy": 98.98, "Clean-Loss": 0.05429802187979221, "PGD-Accuracy": 10.06, "PGD-Loss": 6.651630911254883}, "Total-Time": 30776.55881547928, "Train": {"Loss": 5.06052861905981, "avg t": 1.0218633521751121, "plain loss": 0.24665393879501915, "standard loss": 0.14914715970555942}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.28333282470703, "Augmented-0.05-Quantile-Accuracy": 97.58333587646484, "Augmented-0.1-Quantile-Accuracy": 97.98332977294922, "Augmented-Accuracy": 98.90316666666666, "Augmented-Loss": 0.10018162344773611, "Clean-Accuracy": 99.08333333333333, "Clean-Loss": 0.057435951766868436, "PGD-Accuracy": 9.8, "PGD-Loss": 6.241420873006185}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 133, "Epoch-Time": 241.16935849189758, "Test": {"Augmented-0.01-Quantile-Accuracy": 90.54000091552734, "Augmented-0.05-Quantile-Accuracy": 94.69999694824219, "Augmented-0.1-Quantile-Accuracy": 95.90999603271484, "Augmented-Accuracy": 97.9227, "Augmented-Loss": 0.21936514520978928, "Clean-Accuracy": 98.85, "Clean-Loss": 0.06060533882379532, "PGD-Accuracy": 10.92, "PGD-Loss": 3.9943068908691406}, "Total-Time": 31017.728173971176, "Train": {"Loss": 2.3886393465112756, "avg t": 1.0097086934690123, "plain loss": 0.19151025295257584, "standard loss": 0.09811316015819709}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 92.5, "Augmented-0.05-Quantile-Accuracy": 95.5999984741211, "Augmented-0.1-Quantile-Accuracy": 96.44999694824219, "Augmented-Accuracy": 98.181, "Augmented-Loss": 0.19311410660465558, "Clean-Accuracy": 98.88333333333334, "Clean-Loss": 0.05687297380963961, "PGD-Accuracy": 10.216666666666667, "PGD-Loss": 3.8403578084309897}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 134, "Epoch-Time": 241.25793051719666, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.75, "Augmented-0.05-Quantile-Accuracy": 97.36000061035156, "Augmented-0.1-Quantile-Accuracy": 97.91999816894531, "Augmented-Accuracy": 98.8752, "Augmented-Loss": 0.09132374379062652, "Clean-Accuracy": 99.02, "Clean-Loss": 0.04369543939679861, "PGD-Accuracy": 10.94, "PGD-Loss": 5.031176290893555}, "Total-Time": 31258.986104488373, "Train": {"Loss": 1.9964547661675347, "avg t": 1.0065704797108967, "plain loss": 0.17879197714770292, "standard loss": 0.08681166926081534}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.53333282470703, "Augmented-0.05-Quantile-Accuracy": 97.68333435058594, "Augmented-0.1-Quantile-Accuracy": 98.23332977294922, "Augmented-Accuracy": 98.91683333333333, "Augmented-Loss": 0.08329812014460564, "Clean-Accuracy": 99.01666666666667, "Clean-Loss": 0.041979450337588785, "PGD-Accuracy": 10.133333333333333, "PGD-Loss": 4.80800412495931}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 135, "Epoch-Time": 241.42388916015625, "Test": {"Augmented-0.01-Quantile-Accuracy": 87.11000061035156, "Augmented-0.05-Quantile-Accuracy": 92.29999542236328, "Augmented-0.1-Quantile-Accuracy": 93.81999969482422, "Augmented-Accuracy": 96.81, "Augmented-Loss": 0.18539102405548097, "Clean-Accuracy": 97.91, "Clean-Loss": 0.09843466905355454, "PGD-Accuracy": 7.03, "PGD-Loss": 11.394346380615234}, "Total-Time": 31500.40999364853, "Train": {"Loss": 1.962268758915089, "avg t": 1.006162348959181, "plain loss": 0.17465622782177398, "standard loss": 0.08469879253222434}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 89.08333587646484, "Augmented-0.05-Quantile-Accuracy": 93.51666259765625, "Augmented-0.1-Quantile-Accuracy": 94.88333129882812, "Augmented-Accuracy": 97.21816666666666, "Augmented-Loss": 0.16389866842865944, "Clean-Accuracy": 98.13333333333334, "Clean-Loss": 0.09042336871971687, "PGD-Accuracy": 6.133333333333334, "PGD-Loss": 11.708792663574219}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 136, "Epoch-Time": 221.4027087688446, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.65999603271484, "Augmented-0.05-Quantile-Accuracy": 97.45999908447266, "Augmented-0.1-Quantile-Accuracy": 97.87999725341797, "Augmented-Accuracy": 98.8635, "Augmented-Loss": 0.1121366677520275, "Clean-Accuracy": 98.98, "Clean-Loss": 0.05339319320321083, "PGD-Accuracy": 11.15, "PGD-Loss": 4.032384651184082}, "Total-Time": 31721.812702417374, "Train": {"Loss": 1.8637008426807544, "avg t": 1.0057535430060494, "plain loss": 0.17234900997832964, "standard loss": 0.08669308144626794}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.44999694824219, "Augmented-0.05-Quantile-Accuracy": 97.53333282470703, "Augmented-0.1-Quantile-Accuracy": 98.0999984741211, "Augmented-Accuracy": 98.8675, "Augmented-Loss": 0.09851980257014434, "Clean-Accuracy": 99.0, "Clean-Loss": 0.04923204299807549, "PGD-Accuracy": 10.45, "PGD-Loss": 3.9287441380818686}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 137, "Epoch-Time": 209.47518372535706, "Test": {"Augmented-0.01-Quantile-Accuracy": 92.54999542236328, "Augmented-0.05-Quantile-Accuracy": 95.50999450683594, "Augmented-0.1-Quantile-Accuracy": 96.5, "Augmented-Accuracy": 98.211, "Augmented-Loss": 0.18804993299770356, "Clean-Accuracy": 98.83, "Clean-Loss": 0.07024692542552947, "PGD-Accuracy": 11.05, "PGD-Loss": 3.833925259399414}, "Total-Time": 31931.28788614273, "Train": {"Loss": 7.0837789732615155, "avg t": 1.0149445634418064, "plain loss": 0.23885691658302616, "standard loss": 0.12334680637179149}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 93.5, "Augmented-0.05-Quantile-Accuracy": 96.28333282470703, "Augmented-0.1-Quantile-Accuracy": 96.88333129882812, "Augmented-Accuracy": 98.35116666666667, "Augmented-Loss": 0.17313946270982425, "Clean-Accuracy": 98.9, "Clean-Loss": 0.06656064825256666, "PGD-Accuracy": 10.616666666666667, "PGD-Loss": 3.700412259419759}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 138, "Epoch-Time": 239.5594925880432, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.08999633789062, "Augmented-0.05-Quantile-Accuracy": 96.40999603271484, "Augmented-0.1-Quantile-Accuracy": 97.11000061035156, "Augmented-Accuracy": 98.5054, "Augmented-Loss": 0.16935605805826187, "Clean-Accuracy": 98.97, "Clean-Loss": 0.06046610743999481, "PGD-Accuracy": 10.52, "PGD-Loss": 3.9169890167236328}, "Total-Time": 32170.847378730774, "Train": {"Loss": 2.8050906896237975, "avg t": 1.011635342809889, "plain loss": 0.19334009872542487, "standard loss": 0.0914678797953055}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.25, "Augmented-0.05-Quantile-Accuracy": 97.16666412353516, "Augmented-0.1-Quantile-Accuracy": 97.75, "Augmented-Accuracy": 98.773, "Augmented-Loss": 0.15395184107224147, "Clean-Accuracy": 99.13333333333334, "Clean-Loss": 0.05554077888528506, "PGD-Accuracy": 9.933333333333334, "PGD-Loss": 3.724237030029297}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 139, "Epoch-Time": 241.26928853988647, "Test": {"Augmented-0.01-Quantile-Accuracy": 91.98999786376953, "Augmented-0.05-Quantile-Accuracy": 95.38999938964844, "Augmented-0.1-Quantile-Accuracy": 96.36000061035156, "Augmented-Accuracy": 98.2324, "Augmented-Loss": 0.16315099169540406, "Clean-Accuracy": 98.91, "Clean-Loss": 0.04636615474224091, "PGD-Accuracy": 10.91, "PGD-Loss": 4.390676876831055}, "Total-Time": 32412.11666727066, "Train": {"Loss": 4.754066050988657, "avg t": 1.0129126865245677, "plain loss": 0.21410428539382098, "standard loss": 0.10983604781674566}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 93.61666870117188, "Augmented-0.05-Quantile-Accuracy": 96.19999694824219, "Augmented-0.1-Quantile-Accuracy": 96.96666717529297, "Augmented-Accuracy": 98.4575, "Augmented-Loss": 0.1490151033961773, "Clean-Accuracy": 98.9, "Clean-Loss": 0.04528372393548489, "PGD-Accuracy": 10.2, "PGD-Loss": 4.222579432169597}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 140, "Epoch-Time": 241.53661179542542, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.8699951171875, "Augmented-0.05-Quantile-Accuracy": 97.2699966430664, "Augmented-0.1-Quantile-Accuracy": 97.72999572753906, "Augmented-Accuracy": 98.62, "Augmented-Loss": 0.05994262472052075, "Clean-Accuracy": 98.76, "Clean-Loss": 0.06713351351206648, "PGD-Accuracy": 7.38, "PGD-Loss": 18.765616845703125}, "Total-Time": 32653.653279066086, "Train": {"Loss": 2.751562343173557, "avg t": 1.0116473027335273, "plain loss": 0.19146914383570343, "standard loss": 0.08715661723856573}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.69999694824219, "Augmented-0.05-Quantile-Accuracy": 97.93333435058594, "Augmented-0.1-Quantile-Accuracy": 98.21666717529297, "Augmented-Accuracy": 98.916, "Augmented-Loss": 0.06150459220046197, "Clean-Accuracy": 99.0, "Clean-Loss": 0.07107808645138812, "PGD-Accuracy": 7.383333333333334, "PGD-Loss": 18.657386423746743}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 141, "Epoch-Time": 241.425461769104, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.82999420166016, "Augmented-0.05-Quantile-Accuracy": 97.48999786376953, "Augmented-0.1-Quantile-Accuracy": 97.94999694824219, "Augmented-Accuracy": 98.8252, "Augmented-Loss": 0.048943489116698505, "Clean-Accuracy": 98.96, "Clean-Loss": 0.04130805176533758, "PGD-Accuracy": 9.9, "PGD-Loss": 10.050244506835938}, "Total-Time": 32895.07874083519, "Train": {"Loss": 2.658820277178729, "avg t": 1.0110525400020458, "plain loss": 0.1875566435955189, "standard loss": 0.08821882928963061}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.66666412353516, "Augmented-0.05-Quantile-Accuracy": 97.69999694824219, "Augmented-0.1-Quantile-Accuracy": 98.16666412353516, "Augmented-Accuracy": 98.891, "Augmented-Loss": 0.05070227094321201, "Clean-Accuracy": 98.95, "Clean-Loss": 0.045923799047479404, "PGD-Accuracy": 9.916666666666666, "PGD-Loss": 9.886695231119791}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 142, "Epoch-Time": 206.1755542755127, "Test": {"Augmented-0.01-Quantile-Accuracy": 93.66999816894531, "Augmented-0.05-Quantile-Accuracy": 96.19999694824219, "Augmented-0.1-Quantile-Accuracy": 97.1199951171875, "Augmented-Accuracy": 98.4447, "Augmented-Loss": 0.17868978160762786, "Clean-Accuracy": 98.93, "Clean-Loss": 0.05329890058934689, "PGD-Accuracy": 10.8, "PGD-Loss": 4.47442155456543}, "Total-Time": 33101.2542951107, "Train": {"Loss": 3.41978125, "avg t": 1.0155754951900906, "plain loss": 0.21222106207653343, "standard loss": 0.09581165198443664}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 94.69999694824219, "Augmented-0.05-Quantile-Accuracy": 96.78333282470703, "Augmented-0.1-Quantile-Accuracy": 97.33333587646484, "Augmented-Accuracy": 98.49316666666667, "Augmented-Loss": 0.15426118546863396, "Clean-Accuracy": 98.91666666666667, "Clean-Loss": 0.052445882273217045, "PGD-Accuracy": 10.066666666666666, "PGD-Loss": 4.30460664621989}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 143, "Epoch-Time": 223.8862738609314, "Test": {"Augmented-0.01-Quantile-Accuracy": 85.7699966430664, "Augmented-0.05-Quantile-Accuracy": 92.02999877929688, "Augmented-0.1-Quantile-Accuracy": 93.83999633789062, "Augmented-Accuracy": 96.9525, "Augmented-Loss": 0.339110099981308, "Clean-Accuracy": 98.72, "Clean-Loss": 0.08270529541969299, "PGD-Accuracy": 10.85, "PGD-Loss": 3.746178689575195}, "Total-Time": 33325.140568971634, "Train": {"Loss": 8.67043195187604, "avg t": 1.0318023953614412, "plain loss": 0.29357575137526937, "standard loss": 0.1536373561521371}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 87.76666259765625, "Augmented-0.05-Quantile-Accuracy": 93.5999984741211, "Augmented-0.1-Quantile-Accuracy": 95.0, "Augmented-Accuracy": 97.45933333333333, "Augmented-Loss": 0.3017954660542806, "Clean-Accuracy": 98.75, "Clean-Loss": 0.07080072144667307, "PGD-Accuracy": 10.083333333333334, "PGD-Loss": 3.5664752502441406}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 144, "Epoch-Time": 241.572523355484, "Test": {"Augmented-0.01-Quantile-Accuracy": 93.70999908447266, "Augmented-0.05-Quantile-Accuracy": 96.32999420166016, "Augmented-0.1-Quantile-Accuracy": 97.0999984741211, "Augmented-Accuracy": 98.5577, "Augmented-Loss": 0.10699617648530006, "Clean-Accuracy": 98.89, "Clean-Loss": 0.05039093796014786, "PGD-Accuracy": 10.28, "PGD-Loss": 5.9674404479980465}, "Total-Time": 33566.71309232712, "Train": {"Loss": 3.827921187012284, "avg t": 1.0226766236623128, "plain loss": 0.22385907379256384, "standard loss": 0.11168592058280828}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.21666717529297, "Augmented-0.05-Quantile-Accuracy": 97.08333587646484, "Augmented-0.1-Quantile-Accuracy": 97.68333435058594, "Augmented-Accuracy": 98.7405, "Augmented-Loss": 0.0991133372114102, "Clean-Accuracy": 98.98333333333333, "Clean-Loss": 0.048248055099820095, "PGD-Accuracy": 9.716666666666667, "PGD-Loss": 5.6801205851236976}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 145, "Epoch-Time": 241.33519983291626, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.02999877929688, "Augmented-0.05-Quantile-Accuracy": 97.30999755859375, "Augmented-0.1-Quantile-Accuracy": 97.66999816894531, "Augmented-Accuracy": 98.6449, "Augmented-Loss": 0.06909404593988715, "Clean-Accuracy": 98.85, "Clean-Loss": 0.07974671278467249, "PGD-Accuracy": 4.11, "PGD-Loss": 21.407728662109374}, "Total-Time": 33808.048292160034, "Train": {"Loss": 4.325423064196551, "avg t": 1.0229657346230967, "plain loss": 0.2379836595464636, "standard loss": 0.12297599043704018}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.48332977294922, "Augmented-0.05-Quantile-Accuracy": 97.86666870117188, "Augmented-0.1-Quantile-Accuracy": 98.16666412353516, "Augmented-Accuracy": 98.84616666666666, "Augmented-Loss": 0.07923769479649967, "Clean-Accuracy": 98.83333333333333, "Clean-Loss": 0.09421517286000229, "PGD-Accuracy": 4.133333333333334, "PGD-Loss": 21.20990838623047}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 146, "Epoch-Time": 241.37440729141235, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.18000030517578, "Augmented-0.05-Quantile-Accuracy": 96.93000030517578, "Augmented-0.1-Quantile-Accuracy": 97.79000091552734, "Augmented-Accuracy": 98.7839, "Augmented-Loss": 0.08993390582644939, "Clean-Accuracy": 98.97, "Clean-Loss": 0.04753212822079658, "PGD-Accuracy": 11.0, "PGD-Loss": 5.450405532836914}, "Total-Time": 34049.42269945145, "Train": {"Loss": 3.4106741501843487, "avg t": 1.0176164867613051, "plain loss": 0.22264903194992652, "standard loss": 0.11365614416562365}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.94999694824219, "Augmented-0.05-Quantile-Accuracy": 97.36666870117188, "Augmented-0.1-Quantile-Accuracy": 97.81666564941406, "Augmented-Accuracy": 98.82916666666667, "Augmented-Loss": 0.08344018163154522, "Clean-Accuracy": 99.0, "Clean-Loss": 0.045727390637000404, "PGD-Accuracy": 10.833333333333334, "PGD-Loss": 5.167427777608236}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 147, "Epoch-Time": 218.0525574684143, "Test": {"Augmented-0.01-Quantile-Accuracy": 94.16999816894531, "Augmented-0.05-Quantile-Accuracy": 96.62999725341797, "Augmented-0.1-Quantile-Accuracy": 97.5, "Augmented-Accuracy": 98.6614, "Augmented-Loss": 0.0962870610216856, "Clean-Accuracy": 99.04, "Clean-Loss": 0.0407879080966115, "PGD-Accuracy": 9.43, "PGD-Loss": 5.806916766357422}, "Total-Time": 34267.47525691986, "Train": {"Loss": 3.8642758731135616, "avg t": 1.0201872332537616, "plain loss": 0.2361512985794633, "standard loss": 0.12424398310040986}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 95.08333587646484, "Augmented-0.05-Quantile-Accuracy": 96.8499984741211, "Augmented-0.1-Quantile-Accuracy": 97.71666717529297, "Augmented-Accuracy": 98.74283333333334, "Augmented-Loss": 0.09046981611798206, "Clean-Accuracy": 99.05, "Clean-Loss": 0.0428124302799503, "PGD-Accuracy": 8.883333333333333, "PGD-Loss": 5.548018058776855}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 148, "Epoch-Time": 210.31347584724426, "Test": {"Augmented-0.01-Quantile-Accuracy": 93.1199951171875, "Augmented-0.05-Quantile-Accuracy": 95.95999908447266, "Augmented-0.1-Quantile-Accuracy": 96.91999816894531, "Augmented-Accuracy": 98.4975, "Augmented-Loss": 0.11975098629713059, "Clean-Accuracy": 98.95, "Clean-Loss": 0.044121961537748576, "PGD-Accuracy": 10.59, "PGD-Loss": 5.6664210754394535}, "Total-Time": 34477.788732767105, "Train": {"Loss": 5.326838207032946, "avg t": 1.021132015298914, "plain loss": 0.23974783930955096, "standard loss": 0.11755365297529433}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 94.8499984741211, "Augmented-0.05-Quantile-Accuracy": 97.18333435058594, "Augmented-0.1-Quantile-Accuracy": 97.71666717529297, "Augmented-Accuracy": 98.7455, "Augmented-Loss": 0.10646383977641662, "Clean-Accuracy": 99.11666666666666, "Clean-Loss": 0.04087552690009276, "PGD-Accuracy": 9.883333333333333, "PGD-Loss": 5.3210487518310545}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 149, "Epoch-Time": 241.21121954917908, "Test": {"Augmented-0.01-Quantile-Accuracy": 93.43999481201172, "Augmented-0.05-Quantile-Accuracy": 96.0199966430664, "Augmented-0.1-Quantile-Accuracy": 96.89999389648438, "Augmented-Accuracy": 98.4619, "Augmented-Loss": 0.13601315144062043, "Clean-Accuracy": 98.87, "Clean-Loss": 0.05412838777601719, "PGD-Accuracy": 10.99, "PGD-Loss": 5.533473297119141}, "Total-Time": 34718.999952316284, "Train": {"Loss": 3.2605419757984304, "avg t": 1.0177149627826831, "plain loss": 0.22161787003764397, "standard loss": 0.10207354757803734}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 94.79999542236328, "Augmented-0.05-Quantile-Accuracy": 97.11666870117188, "Augmented-0.1-Quantile-Accuracy": 97.69999694824219, "Augmented-Accuracy": 98.76933333333334, "Augmented-Loss": 0.12535002425233524, "Clean-Accuracy": 99.06666666666666, "Clean-Loss": 0.052314291680852575, "PGD-Accuracy": 10.65, "PGD-Loss": 5.288635866800944}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.01, "cvar_sgd_t_step_size": 0.1, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_four/mnist_mod_001", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.01, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 0.1, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
