{"Epoch": 0, "Epoch-Time": 242.26470732688904, "Test": {"Augmented-0.01-Quantile-Accuracy": 95.56999969482422, "Augmented-0.05-Quantile-Accuracy": 96.72999572753906, "Augmented-0.1-Quantile-Accuracy": 97.0199966430664, "Augmented-Accuracy": 97.9998, "Augmented-Loss": 0.2132503671731949, "Clean-Accuracy": 98.2, "Clean-Loss": 0.1497007306098938, "PGD-Accuracy": 0.51, "PGD-Loss": 4.390511459350586}, "Total-Time": 242.26470732688904, "Train": {"Loss": 1.066843203050119, "avg t": 0.936123614858698, "plain loss": 0.43005698982521295, "standard loss": 0.3555979585338522}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 96.43333435058594, "Augmented-0.05-Quantile-Accuracy": 97.38333129882812, "Augmented-0.1-Quantile-Accuracy": 97.66666412353516, "Augmented-Accuracy": 98.4565, "Augmented-Loss": 0.1960630192367236, "Clean-Accuracy": 98.66666666666667, "Clean-Loss": 0.1362689696153005, "PGD-Accuracy": 0.55, "PGD-Loss": 4.403043980916341}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 1, "Epoch-Time": 242.06356024742126, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.75999450683594, "Augmented-0.05-Quantile-Accuracy": 97.39999389648438, "Augmented-0.1-Quantile-Accuracy": 97.75999450683594, "Augmented-Accuracy": 98.5931, "Augmented-Loss": 0.1779262647781372, "Clean-Accuracy": 98.81, "Clean-Loss": 0.1259930073261261, "PGD-Accuracy": 1.15, "PGD-Loss": 4.372187216186523}, "Total-Time": 484.3282675743103, "Train": {"Loss": 0.9667290913087351, "avg t": 0.9260506271256341, "plain loss": 0.2706896514468725, "standard loss": 0.20108990026844872}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.08333587646484, "Augmented-0.05-Quantile-Accuracy": 97.81666564941406, "Augmented-0.1-Quantile-Accuracy": 98.0999984741211, "Augmented-Accuracy": 98.677, "Augmented-Loss": 0.16978037031173707, "Clean-Accuracy": 98.75, "Clean-Loss": 0.12019706761837005, "PGD-Accuracy": 1.25, "PGD-Loss": 4.3372390162150065}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 2, "Epoch-Time": 242.27989768981934, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.25, "Augmented-0.05-Quantile-Accuracy": 97.2699966430664, "Augmented-0.1-Quantile-Accuracy": 97.70999908447266, "Augmented-Accuracy": 98.543, "Augmented-Loss": 0.19250181996536256, "Clean-Accuracy": 98.7, "Clean-Loss": 0.14153286662101747, "PGD-Accuracy": 0.39, "PGD-Loss": 5.8752130615234375}, "Total-Time": 726.6081652641296, "Train": {"Loss": 0.9555454852492721, "avg t": 0.9246298218656469, "plain loss": 0.23386597660205993, "standard loss": 0.17708374452590941}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.01666259765625, "Augmented-0.05-Quantile-Accuracy": 97.78333282470703, "Augmented-0.1-Quantile-Accuracy": 98.08333587646484, "Augmented-Accuracy": 98.73583333333333, "Augmented-Loss": 0.179799160006841, "Clean-Accuracy": 98.85, "Clean-Loss": 0.13249863620599112, "PGD-Accuracy": 0.2833333333333333, "PGD-Loss": 5.90055073038737}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 3, "Epoch-Time": 222.12532877922058, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.00999450683594, "Augmented-0.05-Quantile-Accuracy": 97.81999969482422, "Augmented-0.1-Quantile-Accuracy": 98.13999938964844, "Augmented-Accuracy": 98.8611, "Augmented-Loss": 0.1301109954557419, "Clean-Accuracy": 99.03, "Clean-Loss": 0.10000481731891632, "PGD-Accuracy": 0.78, "PGD-Loss": 6.454137493896484}, "Total-Time": 948.7334940433502, "Train": {"Loss": 0.9503283554359718, "avg t": 0.9239600489581072, "plain loss": 0.20975879775153256, "standard loss": 0.16414898260875985}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.44999694824219, "Augmented-0.05-Quantile-Accuracy": 98.0999984741211, "Augmented-0.1-Quantile-Accuracy": 98.28333282470703, "Augmented-Accuracy": 98.85583333333334, "Augmented-Loss": 0.12328510341246923, "Clean-Accuracy": 98.98333333333333, "Clean-Loss": 0.0959020672639211, "PGD-Accuracy": 0.7, "PGD-Loss": 6.449409489949544}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 4, "Epoch-Time": 209.33967351913452, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.88999938964844, "Augmented-0.05-Quantile-Accuracy": 97.63999938964844, "Augmented-0.1-Quantile-Accuracy": 98.02999877929688, "Augmented-Accuracy": 98.7446, "Augmented-Loss": 0.14702823393297196, "Clean-Accuracy": 98.86, "Clean-Loss": 0.11485862483978271, "PGD-Accuracy": 2.82, "PGD-Loss": 5.58544645690918}, "Total-Time": 1158.0731675624847, "Train": {"Loss": 0.9463742607964409, "avg t": 0.9234470021283185, "plain loss": 0.18679937873769664, "standard loss": 0.14752340359157987}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.38333129882812, "Augmented-0.05-Quantile-Accuracy": 98.04999542236328, "Augmented-0.1-Quantile-Accuracy": 98.28333282470703, "Augmented-Accuracy": 98.8705, "Augmented-Loss": 0.13521294268449147, "Clean-Accuracy": 98.91666666666667, "Clean-Loss": 0.1056861340602239, "PGD-Accuracy": 2.7, "PGD-Loss": 5.50721440633138}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 5, "Epoch-Time": 239.70506167411804, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.08999633789062, "Augmented-0.05-Quantile-Accuracy": 97.98999786376953, "Augmented-0.1-Quantile-Accuracy": 98.27999877929688, "Augmented-Accuracy": 98.8969, "Augmented-Loss": 0.1790440307970047, "Clean-Accuracy": 98.96, "Clean-Loss": 0.14511491980552674, "PGD-Accuracy": 3.94, "PGD-Loss": 5.666199664306641}, "Total-Time": 1397.7782292366028, "Train": {"Loss": 0.9443256595046432, "avg t": 0.9231290510318897, "plain loss": 0.1748355059235187, "standard loss": 0.13758133558873778}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.33333587646484, "Augmented-0.05-Quantile-Accuracy": 98.03333282470703, "Augmented-0.1-Quantile-Accuracy": 98.21666717529297, "Augmented-Accuracy": 98.85116666666667, "Augmented-Loss": 0.16681827482859293, "Clean-Accuracy": 98.95, "Clean-Loss": 0.1349384387334188, "PGD-Accuracy": 4.233333333333333, "PGD-Loss": 5.615811121622722}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 6, "Epoch-Time": 242.20881342887878, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.29000091552734, "Augmented-0.05-Quantile-Accuracy": 98.0999984741211, "Augmented-0.1-Quantile-Accuracy": 98.39999389648438, "Augmented-Accuracy": 98.9397, "Augmented-Loss": 0.10883422292089462, "Clean-Accuracy": 99.04, "Clean-Loss": 0.0891167741060257, "PGD-Accuracy": 2.18, "PGD-Loss": 6.570348916625977}, "Total-Time": 1639.9870426654816, "Train": {"Loss": 0.9428754291181212, "avg t": 0.9229012268384298, "plain loss": 0.16467210320013548, "standard loss": 0.13184010881406288}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.48332977294922, "Augmented-0.05-Quantile-Accuracy": 98.16666412353516, "Augmented-0.1-Quantile-Accuracy": 98.5, "Augmented-Accuracy": 98.91666666666667, "Augmented-Loss": 0.10597038733283679, "Clean-Accuracy": 98.96666666666667, "Clean-Loss": 0.08793240332603455, "PGD-Accuracy": 2.6, "PGD-Loss": 6.517690633138021}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 7, "Epoch-Time": 242.01898503303528, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.13999938964844, "Augmented-0.05-Quantile-Accuracy": 98.06999969482422, "Augmented-0.1-Quantile-Accuracy": 98.29000091552734, "Augmented-Accuracy": 98.9001, "Augmented-Loss": 0.09531647759437561, "Clean-Accuracy": 99.01, "Clean-Loss": 0.07565094286203385, "PGD-Accuracy": 2.01, "PGD-Loss": 6.897724868774414}, "Total-Time": 1882.0060276985168, "Train": {"Loss": 0.9417288771205479, "avg t": 0.9226977828696922, "plain loss": 0.15532616134219707, "standard loss": 0.12098234396069138}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.6500015258789, "Augmented-0.05-Quantile-Accuracy": 98.26666259765625, "Augmented-0.1-Quantile-Accuracy": 98.44999694824219, "Augmented-Accuracy": 98.987, "Augmented-Loss": 0.08708382933020592, "Clean-Accuracy": 99.05, "Clean-Loss": 0.070005399843057, "PGD-Accuracy": 2.2333333333333334, "PGD-Loss": 6.867080215454101}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 8, "Epoch-Time": 242.2552523612976, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.18999481201172, "Augmented-0.05-Quantile-Accuracy": 97.95999908447266, "Augmented-0.1-Quantile-Accuracy": 98.23999786376953, "Augmented-Accuracy": 98.8849, "Augmented-Loss": 0.11005059660100937, "Clean-Accuracy": 98.97, "Clean-Loss": 0.08633460500240325, "PGD-Accuracy": 2.18, "PGD-Loss": 7.088107293701172}, "Total-Time": 2124.2612800598145, "Train": {"Loss": 0.9407518543137444, "avg t": 0.9225665699994122, "plain loss": 0.15044362048749588, "standard loss": 0.11750699003979012}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.69999694824219, "Augmented-0.05-Quantile-Accuracy": 98.25, "Augmented-0.1-Quantile-Accuracy": 98.48332977294922, "Augmented-Accuracy": 98.95483333333334, "Augmented-Loss": 0.103559434085687, "Clean-Accuracy": 99.05, "Clean-Loss": 0.08234000939130783, "PGD-Accuracy": 2.4, "PGD-Loss": 7.081503911336263}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 9, "Epoch-Time": 204.98288822174072, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.31999969482422, "Augmented-0.05-Quantile-Accuracy": 98.14999389648438, "Augmented-0.1-Quantile-Accuracy": 98.3699951171875, "Augmented-Accuracy": 99.0184, "Augmented-Loss": 0.08749176116728782, "Clean-Accuracy": 99.05, "Clean-Loss": 0.07363669087886811, "PGD-Accuracy": 1.92, "PGD-Loss": 7.051618045043945}, "Total-Time": 2329.244168281555, "Train": {"Loss": 0.9402816980503224, "avg t": 0.9224706301512542, "plain loss": 0.14506906127929683, "standard loss": 0.1169799301204858}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.61666870117188, "Augmented-0.05-Quantile-Accuracy": 98.21666717529297, "Augmented-0.1-Quantile-Accuracy": 98.51666259765625, "Augmented-Accuracy": 99.05166666666666, "Augmented-Loss": 0.08297297616283099, "Clean-Accuracy": 99.13333333333334, "Clean-Loss": 0.07042387506365776, "PGD-Accuracy": 1.9833333333333334, "PGD-Loss": 6.96274323018392}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 10, "Epoch-Time": 224.01917934417725, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.29000091552734, "Augmented-0.05-Quantile-Accuracy": 97.97000122070312, "Augmented-0.1-Quantile-Accuracy": 98.29000091552734, "Augmented-Accuracy": 98.9498, "Augmented-Loss": 0.09195596079254151, "Clean-Accuracy": 99.06, "Clean-Loss": 0.07280758086442947, "PGD-Accuracy": 1.96, "PGD-Loss": 7.584225}, "Total-Time": 2553.2633476257324, "Train": {"Loss": 0.9398014645223264, "avg t": 0.9223875868408768, "plain loss": 0.13466761827468876, "standard loss": 0.10770925562911564}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.5, "Augmented-0.05-Quantile-Accuracy": 98.18333435058594, "Augmented-0.1-Quantile-Accuracy": 98.53333282470703, "Augmented-Accuracy": 99.0215, "Augmented-Loss": 0.0873113741328319, "Clean-Accuracy": 99.13333333333334, "Clean-Loss": 0.07018840005000432, "PGD-Accuracy": 1.9833333333333334, "PGD-Loss": 7.6004119364420575}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 11, "Epoch-Time": 242.0563542842865, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.79000091552734, "Augmented-0.05-Quantile-Accuracy": 97.66999816894531, "Augmented-0.1-Quantile-Accuracy": 97.97999572753906, "Augmented-Accuracy": 98.7688, "Augmented-Loss": 0.11470626304197311, "Clean-Accuracy": 98.86, "Clean-Loss": 0.08451492595672608, "PGD-Accuracy": 4.59, "PGD-Loss": 5.990081576538086}, "Total-Time": 2795.319701910019, "Train": {"Loss": 0.9395782434675428, "avg t": 0.922348486299868, "plain loss": 0.13318323673672153, "standard loss": 0.10280836002914993}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.11666870117188, "Augmented-0.05-Quantile-Accuracy": 97.96666717529297, "Augmented-0.1-Quantile-Accuracy": 98.1500015258789, "Augmented-Accuracy": 98.838, "Augmented-Loss": 0.10970572943290074, "Clean-Accuracy": 99.0, "Clean-Loss": 0.08274473547935486, "PGD-Accuracy": 4.033333333333333, "PGD-Loss": 5.929558792114258}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 12, "Epoch-Time": 242.45035004615784, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.89999389648438, "Augmented-0.05-Quantile-Accuracy": 97.79999542236328, "Augmented-0.1-Quantile-Accuracy": 98.11000061035156, "Augmented-Accuracy": 98.8087, "Augmented-Loss": 0.11143911889171601, "Clean-Accuracy": 98.88, "Clean-Loss": 0.08602890932559967, "PGD-Accuracy": 3.41, "PGD-Loss": 6.675840628051758}, "Total-Time": 3037.7700519561768, "Train": {"Loss": 0.939322671395761, "avg t": 0.9222958711871394, "plain loss": 0.1367318834446096, "standard loss": 0.1039189243890621}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.25, "Augmented-0.05-Quantile-Accuracy": 97.93333435058594, "Augmented-0.1-Quantile-Accuracy": 98.31666564941406, "Augmented-Accuracy": 98.87466666666667, "Augmented-Loss": 0.10648578725536664, "Clean-Accuracy": 99.05, "Clean-Loss": 0.08352172120412191, "PGD-Accuracy": 3.1, "PGD-Loss": 6.675749557495117}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 13, "Epoch-Time": 242.1295464038849, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.36000061035156, "Augmented-0.05-Quantile-Accuracy": 98.08999633789062, "Augmented-0.1-Quantile-Accuracy": 98.36000061035156, "Augmented-Accuracy": 99.0258, "Augmented-Loss": 0.09021894651985168, "Clean-Accuracy": 99.12, "Clean-Loss": 0.07224152963161469, "PGD-Accuracy": 3.51, "PGD-Loss": 6.519309301757812}, "Total-Time": 3279.8995983600616, "Train": {"Loss": 0.9392702182487205, "avg t": 0.9222833027486448, "plain loss": 0.13210834561453927, "standard loss": 0.10349949115514755}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.6500015258789, "Augmented-0.05-Quantile-Accuracy": 98.33333587646484, "Augmented-0.1-Quantile-Accuracy": 98.46666717529297, "Augmented-Accuracy": 99.041, "Augmented-Loss": 0.08655046556830406, "Clean-Accuracy": 99.13333333333334, "Clean-Loss": 0.07032527200380961, "PGD-Accuracy": 3.6166666666666667, "PGD-Loss": 6.5020428517659505}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 14, "Epoch-Time": 217.02871894836426, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.19999694824219, "Augmented-0.05-Quantile-Accuracy": 97.98999786376953, "Augmented-0.1-Quantile-Accuracy": 98.29999542236328, "Augmented-Accuracy": 98.9898, "Augmented-Loss": 0.09969329842019081, "Clean-Accuracy": 99.16, "Clean-Loss": 0.07556455466747283, "PGD-Accuracy": 4.07, "PGD-Loss": 6.519395251464844}, "Total-Time": 3496.928317308426, "Train": {"Loss": 0.9391848786671957, "avg t": 0.9222499026192559, "plain loss": 0.13015474716115877, "standard loss": 0.0975953348521833}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.46666717529297, "Augmented-0.05-Quantile-Accuracy": 98.03333282470703, "Augmented-0.1-Quantile-Accuracy": 98.31666564941406, "Augmented-Accuracy": 98.91366666666667, "Augmented-Loss": 0.09559528851727644, "Clean-Accuracy": 99.06666666666666, "Clean-Loss": 0.07400179614623388, "PGD-Accuracy": 4.516666666666667, "PGD-Loss": 6.451145833333333}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 15, "Epoch-Time": 211.18735027313232, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.32999420166016, "Augmented-0.05-Quantile-Accuracy": 98.04999542236328, "Augmented-0.1-Quantile-Accuracy": 98.3699951171875, "Augmented-Accuracy": 98.9982, "Augmented-Loss": 0.09120384966492653, "Clean-Accuracy": 99.05, "Clean-Loss": 0.0712321204662323, "PGD-Accuracy": 3.06, "PGD-Loss": 6.414730865478516}, "Total-Time": 3708.1156675815582, "Train": {"Loss": 0.938886960418136, "avg t": 0.9222191446445607, "plain loss": 0.12986187271895233, "standard loss": 0.0966823177602556}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.68333435058594, "Augmented-0.05-Quantile-Accuracy": 98.31666564941406, "Augmented-0.1-Quantile-Accuracy": 98.58333587646484, "Augmented-Accuracy": 99.03816666666667, "Augmented-Loss": 0.08546300941705703, "Clean-Accuracy": 99.13333333333334, "Clean-Loss": 0.06796974154313405, "PGD-Accuracy": 3.216666666666667, "PGD-Loss": 6.341663218180338}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 16, "Epoch-Time": 241.9413502216339, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.25999450683594, "Augmented-0.05-Quantile-Accuracy": 98.00999450683594, "Augmented-0.1-Quantile-Accuracy": 98.3499984741211, "Augmented-Accuracy": 98.9358, "Augmented-Loss": 0.094017403185606, "Clean-Accuracy": 99.04, "Clean-Loss": 0.07314398891925812, "PGD-Accuracy": 3.82, "PGD-Loss": 6.587252130126953}, "Total-Time": 3950.057017803192, "Train": {"Loss": 0.9388382073861581, "avg t": 0.9221919170662208, "plain loss": 0.12453199209283898, "standard loss": 0.09306194637219112}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.54999542236328, "Augmented-0.05-Quantile-Accuracy": 98.29999542236328, "Augmented-0.1-Quantile-Accuracy": 98.44999694824219, "Augmented-Accuracy": 98.9695, "Augmented-Loss": 0.08921188948869706, "Clean-Accuracy": 99.0, "Clean-Loss": 0.07045562257369359, "PGD-Accuracy": 3.716666666666667, "PGD-Loss": 6.519601842244466}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 17, "Epoch-Time": 242.42958235740662, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.19999694824219, "Augmented-0.05-Quantile-Accuracy": 98.04999542236328, "Augmented-0.1-Quantile-Accuracy": 98.31999969482422, "Augmented-Accuracy": 98.979, "Augmented-Loss": 0.09940205012202263, "Clean-Accuracy": 99.1, "Clean-Loss": 0.07506537847518921, "PGD-Accuracy": 3.55, "PGD-Loss": 6.680306481933593}, "Total-Time": 4192.486600160599, "Train": {"Loss": 0.9387874015702141, "avg t": 0.9221838917908846, "plain loss": 0.12155304141221221, "standard loss": 0.09189979977519423}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.41666412353516, "Augmented-0.05-Quantile-Accuracy": 98.25, "Augmented-0.1-Quantile-Accuracy": 98.5, "Augmented-Accuracy": 99.04016666666666, "Augmented-Loss": 0.0933331047709783, "Clean-Accuracy": 99.11666666666666, "Clean-Loss": 0.07164446665843328, "PGD-Accuracy": 3.7333333333333334, "PGD-Loss": 6.681690338134765}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 18, "Epoch-Time": 241.98906874656677, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.39999389648438, "Augmented-0.05-Quantile-Accuracy": 98.23999786376953, "Augmented-0.1-Quantile-Accuracy": 98.47000122070312, "Augmented-Accuracy": 99.0125, "Augmented-Loss": 0.10439108861327172, "Clean-Accuracy": 99.1, "Clean-Loss": 0.07607748029232025, "PGD-Accuracy": 5.5, "PGD-Loss": 5.961161428833008}, "Total-Time": 4434.4756689071655, "Train": {"Loss": 0.9387242060060854, "avg t": 0.922162893931071, "plain loss": 0.12433861080452249, "standard loss": 0.09127596322695414}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.3499984741211, "Augmented-0.05-Quantile-Accuracy": 98.26666259765625, "Augmented-0.1-Quantile-Accuracy": 98.44999694824219, "Augmented-Accuracy": 98.978, "Augmented-Loss": 0.09807046997090181, "Clean-Accuracy": 99.01666666666667, "Clean-Loss": 0.0728786458770434, "PGD-Accuracy": 5.483333333333333, "PGD-Loss": 5.904699872334798}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 19, "Epoch-Time": 239.45508193969727, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.43999481201172, "Augmented-0.05-Quantile-Accuracy": 98.13999938964844, "Augmented-0.1-Quantile-Accuracy": 98.48999786376953, "Augmented-Accuracy": 99.0495, "Augmented-Loss": 0.08691882079410553, "Clean-Accuracy": 99.17, "Clean-Loss": 0.0640051687836647, "PGD-Accuracy": 2.77, "PGD-Loss": 6.751573352050781}, "Total-Time": 4673.930750846863, "Train": {"Loss": 0.9386296536657546, "avg t": 0.922145243415126, "plain loss": 0.12150796727074516, "standard loss": 0.08861698451417464}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.68333435058594, "Augmented-0.05-Quantile-Accuracy": 98.29999542236328, "Augmented-0.1-Quantile-Accuracy": 98.54999542236328, "Augmented-Accuracy": 98.99983333333333, "Augmented-Loss": 0.084790355681777, "Clean-Accuracy": 99.06666666666666, "Clean-Loss": 0.06476387534538905, "PGD-Accuracy": 2.8333333333333335, "PGD-Loss": 6.749642598470052}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 20, "Epoch-Time": 204.30103611946106, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.37999725341797, "Augmented-0.05-Quantile-Accuracy": 98.19999694824219, "Augmented-0.1-Quantile-Accuracy": 98.40999603271484, "Augmented-Accuracy": 99.0479, "Augmented-Loss": 0.08463915100502968, "Clean-Accuracy": 99.19, "Clean-Loss": 0.06578220357894897, "PGD-Accuracy": 2.91, "PGD-Loss": 6.521952893066406}, "Total-Time": 4878.231786966324, "Train": {"Loss": 0.9384899873027095, "avg t": 0.9221308048389576, "plain loss": 0.12167077758930328, "standard loss": 0.09191405220384952}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.79999542236328, "Augmented-0.05-Quantile-Accuracy": 98.48332977294922, "Augmented-0.1-Quantile-Accuracy": 98.66666412353516, "Augmented-Accuracy": 99.07883333333334, "Augmented-Loss": 0.07992055411994457, "Clean-Accuracy": 99.15, "Clean-Loss": 0.06329203164577483, "PGD-Accuracy": 2.716666666666667, "PGD-Loss": 6.560439748128255}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 21, "Epoch-Time": 226.01680302619934, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.32999420166016, "Augmented-0.05-Quantile-Accuracy": 98.18999481201172, "Augmented-0.1-Quantile-Accuracy": 98.47000122070312, "Augmented-Accuracy": 99.0561, "Augmented-Loss": 0.09238398858046531, "Clean-Accuracy": 99.14, "Clean-Loss": 0.06920181064605713, "PGD-Accuracy": 2.98, "PGD-Loss": 6.741104092407227}, "Total-Time": 5104.248589992523, "Train": {"Loss": 0.9386025566878142, "avg t": 0.9221352888743083, "plain loss": 0.11639440643522472, "standard loss": 0.08791991586596877}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.6500015258789, "Augmented-0.05-Quantile-Accuracy": 98.26666259765625, "Augmented-0.1-Quantile-Accuracy": 98.56666564941406, "Augmented-Accuracy": 99.09116666666667, "Augmented-Loss": 0.0868583856813113, "Clean-Accuracy": 99.2, "Clean-Loss": 0.06649833593765894, "PGD-Accuracy": 3.3333333333333335, "PGD-Loss": 6.675492772420247}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 22, "Epoch-Time": 241.88745164871216, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.50999450683594, "Augmented-0.05-Quantile-Accuracy": 98.37999725341797, "Augmented-0.1-Quantile-Accuracy": 98.61000061035156, "Augmented-Accuracy": 99.1066, "Augmented-Loss": 0.08665316854929923, "Clean-Accuracy": 99.22, "Clean-Loss": 0.06282834059000016, "PGD-Accuracy": 3.94, "PGD-Loss": 6.361578775024414}, "Total-Time": 5346.136041641235, "Train": {"Loss": 0.9384239935698333, "avg t": 0.9221217084814001, "plain loss": 0.11817668387095148, "standard loss": 0.08665452939492685}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.94999694824219, "Augmented-0.05-Quantile-Accuracy": 98.41666412353516, "Augmented-0.1-Quantile-Accuracy": 98.58333587646484, "Augmented-Accuracy": 99.08233333333334, "Augmented-Loss": 0.08184380099991957, "Clean-Accuracy": 99.13333333333334, "Clean-Loss": 0.06090269328157107, "PGD-Accuracy": 4.2, "PGD-Loss": 6.236003832499186}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 23, "Epoch-Time": 241.869877576828, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.22999572753906, "Augmented-0.05-Quantile-Accuracy": 98.04000091552734, "Augmented-0.1-Quantile-Accuracy": 98.33999633789062, "Augmented-Accuracy": 98.9921, "Augmented-Loss": 0.09336257291340828, "Clean-Accuracy": 99.15, "Clean-Loss": 0.06804216871261597, "PGD-Accuracy": 3.83, "PGD-Loss": 6.314211450195312}, "Total-Time": 5588.005919218063, "Train": {"Loss": 0.9385275955906621, "avg t": 0.9221287405932391, "plain loss": 0.11913908808672878, "standard loss": 0.08502899670159375}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.41666412353516, "Augmented-0.05-Quantile-Accuracy": 98.23332977294922, "Augmented-0.1-Quantile-Accuracy": 98.56666564941406, "Augmented-Accuracy": 99.03366666666666, "Augmented-Loss": 0.08682398128469786, "Clean-Accuracy": 99.16666666666667, "Clean-Loss": 0.06451760454972585, "PGD-Accuracy": 4.266666666666667, "PGD-Loss": 6.282019734700521}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 24, "Epoch-Time": 241.95537114143372, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.3499984741211, "Augmented-0.05-Quantile-Accuracy": 98.19999694824219, "Augmented-0.1-Quantile-Accuracy": 98.48999786376953, "Augmented-Accuracy": 99.0419, "Augmented-Loss": 0.09198332979488373, "Clean-Accuracy": 99.16, "Clean-Loss": 0.06926723666191101, "PGD-Accuracy": 4.25, "PGD-Loss": 6.259564416503906}, "Total-Time": 5829.961290359497, "Train": {"Loss": 0.9384709371990627, "avg t": 0.9221143109356915, "plain loss": 0.1169202612417715, "standard loss": 0.0840243295872653}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.53333282470703, "Augmented-0.05-Quantile-Accuracy": 98.13333129882812, "Augmented-0.1-Quantile-Accuracy": 98.31666564941406, "Augmented-Accuracy": 98.889, "Augmented-Loss": 0.08786391779045263, "Clean-Accuracy": 98.95, "Clean-Loss": 0.06803126009305319, "PGD-Accuracy": 4.166666666666667, "PGD-Loss": 6.177595016479493}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 25, "Epoch-Time": 213.17303323745728, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.3499984741211, "Augmented-0.05-Quantile-Accuracy": 98.08999633789062, "Augmented-0.1-Quantile-Accuracy": 98.32999420166016, "Augmented-Accuracy": 98.9798, "Augmented-Loss": 0.08028510926365852, "Clean-Accuracy": 99.09, "Clean-Loss": 0.060619753158092496, "PGD-Accuracy": 2.34, "PGD-Loss": 6.81406809387207}, "Total-Time": 6043.134323596954, "Train": {"Loss": 0.9383837348266885, "avg t": 0.9221022742942527, "plain loss": 0.11777950874257963, "standard loss": 0.08519797730004346}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.54999542236328, "Augmented-0.05-Quantile-Accuracy": 98.13333129882812, "Augmented-0.1-Quantile-Accuracy": 98.36666870117188, "Augmented-Accuracy": 98.93566666666666, "Augmented-Loss": 0.07668973752419155, "Clean-Accuracy": 98.96666666666667, "Clean-Loss": 0.059705082992712655, "PGD-Accuracy": 2.533333333333333, "PGD-Loss": 6.73687467956543}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 26, "Epoch-Time": 214.77835416793823, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.31999969482422, "Augmented-0.05-Quantile-Accuracy": 98.02999877929688, "Augmented-0.1-Quantile-Accuracy": 98.38999938964844, "Augmented-Accuracy": 98.9849, "Augmented-Loss": 0.08785603711628914, "Clean-Accuracy": 99.02, "Clean-Loss": 0.06728076636791229, "PGD-Accuracy": 3.2, "PGD-Loss": 6.447961340332031}, "Total-Time": 6257.912677764893, "Train": {"Loss": 0.9383774946707266, "avg t": 0.9220977783909551, "plain loss": 0.11642221978152245, "standard loss": 0.0852812093463209}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.68333435058594, "Augmented-0.05-Quantile-Accuracy": 98.33333587646484, "Augmented-0.1-Quantile-Accuracy": 98.53333282470703, "Augmented-Accuracy": 99.063, "Augmented-Loss": 0.08231235977629821, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.06374019079407056, "PGD-Accuracy": 3.6166666666666667, "PGD-Loss": 6.359782694498698}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 27, "Epoch-Time": 242.30771708488464, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.56999969482422, "Augmented-0.05-Quantile-Accuracy": 98.25, "Augmented-0.1-Quantile-Accuracy": 98.5199966430664, "Augmented-Accuracy": 99.0162, "Augmented-Loss": 0.09414158029675483, "Clean-Accuracy": 99.11, "Clean-Loss": 0.07353319754600525, "PGD-Accuracy": 2.93, "PGD-Loss": 6.3049742797851565}, "Total-Time": 6500.220394849777, "Train": {"Loss": 0.9383314875849971, "avg t": 0.9220959185847529, "plain loss": 0.11676607852865145, "standard loss": 0.08776717841845971}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.66666412353516, "Augmented-0.05-Quantile-Accuracy": 98.23332977294922, "Augmented-0.1-Quantile-Accuracy": 98.38333129882812, "Augmented-Accuracy": 98.97333333333333, "Augmented-Loss": 0.08900386558373768, "Clean-Accuracy": 99.08333333333333, "Clean-Loss": 0.07056810259819031, "PGD-Accuracy": 3.2333333333333334, "PGD-Loss": 6.2557222951253255}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 28, "Epoch-Time": 242.093079328537, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.63999938964844, "Augmented-0.05-Quantile-Accuracy": 98.47000122070312, "Augmented-0.1-Quantile-Accuracy": 98.64999389648438, "Augmented-Accuracy": 99.1356, "Augmented-Loss": 0.08102273975491524, "Clean-Accuracy": 99.24, "Clean-Loss": 0.06190153604745865, "PGD-Accuracy": 2.64, "PGD-Loss": 6.490744232177734}, "Total-Time": 6742.313474178314, "Train": {"Loss": 0.938417140395553, "avg t": 0.922092456040559, "plain loss": 0.1157963365360543, "standard loss": 0.08757346545435764}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.94999694824219, "Augmented-0.05-Quantile-Accuracy": 98.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.19283333333334, "Augmented-Loss": 0.07661281763474147, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.05946642038226128, "PGD-Accuracy": 3.6, "PGD-Loss": 6.345139569600423}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 29, "Epoch-Time": 241.95020508766174, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.40999603271484, "Augmented-0.05-Quantile-Accuracy": 98.23999786376953, "Augmented-0.1-Quantile-Accuracy": 98.5, "Augmented-Accuracy": 99.051, "Augmented-Loss": 0.08874033441472054, "Clean-Accuracy": 99.17, "Clean-Loss": 0.0668230140209198, "PGD-Accuracy": 3.75, "PGD-Loss": 6.260015509033203}, "Total-Time": 6984.263679265976, "Train": {"Loss": 0.9382946123900237, "avg t": 0.922083637908653, "plain loss": 0.11358241424913762, "standard loss": 0.08398510047903768}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.6500015258789, "Augmented-0.05-Quantile-Accuracy": 98.19999694824219, "Augmented-0.1-Quantile-Accuracy": 98.53333282470703, "Augmented-Accuracy": 99.02883333333334, "Augmented-Loss": 0.08352509675145149, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.06380035911003748, "PGD-Accuracy": 4.5, "PGD-Loss": 6.133435653686523}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 30, "Epoch-Time": 239.5751531124115, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.48999786376953, "Augmented-0.05-Quantile-Accuracy": 98.27999877929688, "Augmented-0.1-Quantile-Accuracy": 98.57999420166016, "Augmented-Accuracy": 99.1144, "Augmented-Loss": 0.0988114107875824, "Clean-Accuracy": 99.16, "Clean-Loss": 0.07386416990756989, "PGD-Accuracy": 4.07, "PGD-Loss": 6.035381665039062}, "Total-Time": 7223.838832378387, "Train": {"Loss": 0.9383179921397456, "avg t": 0.9220882507960002, "plain loss": 0.11548496600610232, "standard loss": 0.08509682129930567}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.69999694824219, "Augmented-0.05-Quantile-Accuracy": 98.36666870117188, "Augmented-0.1-Quantile-Accuracy": 98.61666870117188, "Augmented-Accuracy": 99.12016666666666, "Augmented-Loss": 0.09296951442023119, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.07042743251721065, "PGD-Accuracy": 4.283333333333333, "PGD-Loss": 5.953701670328776}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 31, "Epoch-Time": 202.30730676651, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.43000030517578, "Augmented-0.05-Quantile-Accuracy": 98.30999755859375, "Augmented-0.1-Quantile-Accuracy": 98.54999542236328, "Augmented-Accuracy": 99.1381, "Augmented-Loss": 0.0898397075908184, "Clean-Accuracy": 99.26, "Clean-Loss": 0.0659703961610794, "PGD-Accuracy": 3.17, "PGD-Loss": 6.144751736450195}, "Total-Time": 7426.1461391448975, "Train": {"Loss": 0.9382846514383952, "avg t": 0.9220703001375552, "plain loss": 0.1135218085942446, "standard loss": 0.0822808263765441}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.76666259765625, "Augmented-0.05-Quantile-Accuracy": 98.41666412353516, "Augmented-0.1-Quantile-Accuracy": 98.68333435058594, "Augmented-Accuracy": 99.0845, "Augmented-Loss": 0.08429048793653647, "Clean-Accuracy": 99.11666666666666, "Clean-Loss": 0.06317386378844579, "PGD-Accuracy": 3.4, "PGD-Loss": 6.070227447509765}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 32, "Epoch-Time": 228.59234523773193, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.5199966430664, "Augmented-0.05-Quantile-Accuracy": 98.29999542236328, "Augmented-0.1-Quantile-Accuracy": 98.54000091552734, "Augmented-Accuracy": 99.1003, "Augmented-Loss": 0.0924198626022339, "Clean-Accuracy": 99.22, "Clean-Loss": 0.07020183589458466, "PGD-Accuracy": 3.14, "PGD-Loss": 5.8855459594726565}, "Total-Time": 7654.738484382629, "Train": {"Loss": 0.9382608608669705, "avg t": 0.9220675606374388, "plain loss": 0.11348909831576873, "standard loss": 0.08526912007508454}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.81666564941406, "Augmented-0.05-Quantile-Accuracy": 98.28333282470703, "Augmented-0.1-Quantile-Accuracy": 98.51666259765625, "Augmented-Accuracy": 99.05166666666666, "Augmented-Loss": 0.08717649789631367, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.067137541949749, "PGD-Accuracy": 4.0, "PGD-Loss": 5.8064830830891925}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 33, "Epoch-Time": 242.117826461792, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.68999481201172, "Augmented-0.05-Quantile-Accuracy": 98.32999420166016, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.1346, "Augmented-Loss": 0.08018320533847809, "Clean-Accuracy": 99.26, "Clean-Loss": 0.05920444957017899, "PGD-Accuracy": 2.39, "PGD-Loss": 6.74252769165039}, "Total-Time": 7896.856310844421, "Train": {"Loss": 0.9382364246933549, "avg t": 0.9220675511183563, "plain loss": 0.11325683922944242, "standard loss": 0.0841762556389526}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.94999694824219, "Augmented-0.05-Quantile-Accuracy": 98.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.73332977294922, "Augmented-Accuracy": 99.12416666666667, "Augmented-Loss": 0.07671592291235924, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.05821747835477193, "PGD-Accuracy": 3.25, "PGD-Loss": 6.585372492472331}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 34, "Epoch-Time": 242.01616835594177, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.54999542236328, "Augmented-0.05-Quantile-Accuracy": 98.25999450683594, "Augmented-0.1-Quantile-Accuracy": 98.45999908447266, "Augmented-Accuracy": 99.0655, "Augmented-Loss": 0.07732524905633927, "Clean-Accuracy": 99.18, "Clean-Loss": 0.05711172804832459, "PGD-Accuracy": 2.3, "PGD-Loss": 6.070516427612304}, "Total-Time": 8138.872479200363, "Train": {"Loss": 0.9382362288898892, "avg t": 0.9220614573160807, "plain loss": 0.1144272401067947, "standard loss": 0.08150897472434573}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.79999542236328, "Augmented-0.05-Quantile-Accuracy": 98.48332977294922, "Augmented-0.1-Quantile-Accuracy": 98.66666412353516, "Augmented-Accuracy": 99.1245, "Augmented-Loss": 0.07327385655979315, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.05535085793336233, "PGD-Accuracy": 2.466666666666667, "PGD-Loss": 5.955200709025065}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 35, "Epoch-Time": 242.287348985672, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.50999450683594, "Augmented-0.05-Quantile-Accuracy": 98.1199951171875, "Augmented-0.1-Quantile-Accuracy": 98.38999938964844, "Augmented-Accuracy": 99.106, "Augmented-Loss": 0.08363833773779869, "Clean-Accuracy": 99.25, "Clean-Loss": 0.06170764803886414, "PGD-Accuracy": 2.92, "PGD-Loss": 5.911152487182617}, "Total-Time": 8381.159828186035, "Train": {"Loss": 0.9382611630051224, "avg t": 0.9220668461411088, "plain loss": 0.11646969213485726, "standard loss": 0.08435460727303117}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.71666717529297, "Augmented-0.05-Quantile-Accuracy": 98.33333587646484, "Augmented-0.1-Quantile-Accuracy": 98.56666564941406, "Augmented-Accuracy": 99.03233333333333, "Augmented-Loss": 0.07936734597543875, "Clean-Accuracy": 99.13333333333334, "Clean-Loss": 0.06012730293472608, "PGD-Accuracy": 3.25, "PGD-Loss": 5.828791498819987}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 36, "Epoch-Time": 208.80315375328064, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.62999725341797, "Augmented-0.05-Quantile-Accuracy": 98.23999786376953, "Augmented-0.1-Quantile-Accuracy": 98.5, "Augmented-Accuracy": 99.1308, "Augmented-Loss": 0.09120022540855408, "Clean-Accuracy": 99.28, "Clean-Loss": 0.064954634141922, "PGD-Accuracy": 1.74, "PGD-Loss": 6.034924386596679}, "Total-Time": 8589.962981939316, "Train": {"Loss": 0.9382589805920919, "avg t": 0.9220686889224582, "plain loss": 0.1145004756750884, "standard loss": 0.08164790739174242}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.8499984741211, "Augmented-0.05-Quantile-Accuracy": 98.43333435058594, "Augmented-0.1-Quantile-Accuracy": 98.63333129882812, "Augmented-Accuracy": 99.06483333333334, "Augmented-Loss": 0.08584377714971701, "Clean-Accuracy": 99.08333333333333, "Clean-Loss": 0.06272924106319745, "PGD-Accuracy": 2.25, "PGD-Loss": 5.922914408365886}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 37, "Epoch-Time": 218.51096153259277, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.68999481201172, "Augmented-0.05-Quantile-Accuracy": 98.39999389648438, "Augmented-0.1-Quantile-Accuracy": 98.65999603271484, "Augmented-Accuracy": 99.1455, "Augmented-Loss": 0.08612856417918205, "Clean-Accuracy": 99.28, "Clean-Loss": 0.062197443234920505, "PGD-Accuracy": 2.46, "PGD-Loss": 5.998701715087891}, "Total-Time": 8808.473943471909, "Train": {"Loss": 0.9382072719291404, "avg t": 0.9220548878599096, "plain loss": 0.11506990985870366, "standard loss": 0.08279147556755277}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.81666564941406, "Augmented-0.05-Quantile-Accuracy": 98.41666412353516, "Augmented-0.1-Quantile-Accuracy": 98.61666870117188, "Augmented-Accuracy": 99.079, "Augmented-Loss": 0.08294341374576092, "Clean-Accuracy": 99.15, "Clean-Loss": 0.0616816844244798, "PGD-Accuracy": 2.7, "PGD-Loss": 5.860780400594075}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 38, "Epoch-Time": 242.36081218719482, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.6199951171875, "Augmented-0.05-Quantile-Accuracy": 98.3699951171875, "Augmented-0.1-Quantile-Accuracy": 98.54000091552734, "Augmented-Accuracy": 99.0673, "Augmented-Loss": 0.08223196674895286, "Clean-Accuracy": 99.17, "Clean-Loss": 0.06007446796894073, "PGD-Accuracy": 2.11, "PGD-Loss": 6.249502792358398}, "Total-Time": 9050.834755659103, "Train": {"Loss": 0.9382340686939381, "avg t": 0.9220640501269588, "plain loss": 0.11199177733174079, "standard loss": 0.07919171391372327}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0, "Augmented-0.05-Quantile-Accuracy": 98.48332977294922, "Augmented-0.1-Quantile-Accuracy": 98.66666412353516, "Augmented-Accuracy": 99.10083333333333, "Augmented-Loss": 0.07844300939897696, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.05891817847887675, "PGD-Accuracy": 2.3833333333333333, "PGD-Loss": 6.129506556193034}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 39, "Epoch-Time": 241.8907027244568, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.45999908447266, "Augmented-0.05-Quantile-Accuracy": 98.20999908447266, "Augmented-0.1-Quantile-Accuracy": 98.50999450683594, "Augmented-Accuracy": 99.0666, "Augmented-Loss": 0.0900568362288475, "Clean-Accuracy": 99.17, "Clean-Loss": 0.06740953984260559, "PGD-Accuracy": 2.62, "PGD-Loss": 6.054709185791015}, "Total-Time": 9292.72545838356, "Train": {"Loss": 0.9382793708730627, "avg t": 0.9220629228662561, "plain loss": 0.1131136871479177, "standard loss": 0.08054576856780936}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.86666870117188, "Augmented-0.05-Quantile-Accuracy": 98.41666412353516, "Augmented-0.1-Quantile-Accuracy": 98.5999984741211, "Augmented-Accuracy": 99.107, "Augmented-Loss": 0.0842658168009917, "Clean-Accuracy": 99.15, "Clean-Loss": 0.06384254528085391, "PGD-Accuracy": 3.0833333333333335, "PGD-Loss": 6.0534532979329425}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 40, "Epoch-Time": 241.95513939857483, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.64999389648438, "Augmented-0.05-Quantile-Accuracy": 98.2699966430664, "Augmented-0.1-Quantile-Accuracy": 98.57999420166016, "Augmented-Accuracy": 99.1045, "Augmented-Loss": 0.08186227373504638, "Clean-Accuracy": 99.23, "Clean-Loss": 0.05918187519311905, "PGD-Accuracy": 2.85, "PGD-Loss": 6.087452520751953}, "Total-Time": 9534.680597782135, "Train": {"Loss": 0.9381389650062278, "avg t": 0.9220496593934518, "plain loss": 0.10862979487666367, "standard loss": 0.0794775850530024}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.81666564941406, "Augmented-0.05-Quantile-Accuracy": 98.51666259765625, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.10466666666666, "Augmented-Loss": 0.07620780526379745, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.056199009358882904, "PGD-Accuracy": 3.066666666666667, "PGD-Loss": 6.094033935546875}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 41, "Epoch-Time": 238.07542848587036, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.70999908447266, "Augmented-0.05-Quantile-Accuracy": 98.40999603271484, "Augmented-0.1-Quantile-Accuracy": 98.6199951171875, "Augmented-Accuracy": 99.1656, "Augmented-Loss": 0.08401555440568924, "Clean-Accuracy": 99.32, "Clean-Loss": 0.05921288549900055, "PGD-Accuracy": 2.33, "PGD-Loss": 6.062298529052734}, "Total-Time": 9772.756026268005, "Train": {"Loss": 0.9381790267273232, "avg t": 0.9220488486113372, "plain loss": 0.10999439318974831, "standard loss": 0.07871134201685588}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.98332977294922, "Augmented-0.05-Quantile-Accuracy": 98.56666564941406, "Augmented-0.1-Quantile-Accuracy": 98.66666412353516, "Augmented-Accuracy": 99.13433333333333, "Augmented-Loss": 0.07921026249508063, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.0572387737929821, "PGD-Accuracy": 2.8666666666666667, "PGD-Loss": 6.03533322652181}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 42, "Epoch-Time": 201.77126669883728, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.58999633789062, "Augmented-0.05-Quantile-Accuracy": 98.3699951171875, "Augmented-0.1-Quantile-Accuracy": 98.61000061035156, "Augmented-Accuracy": 99.1512, "Augmented-Loss": 0.08463278272652626, "Clean-Accuracy": 99.29, "Clean-Loss": 0.06102233920097351, "PGD-Accuracy": 2.63, "PGD-Loss": 5.933047842407227}, "Total-Time": 9974.527292966843, "Train": {"Loss": 0.9381825559404161, "avg t": 0.9220445466924597, "plain loss": 0.10981100402054972, "standard loss": 0.07701189587955122}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.9000015258789, "Augmented-0.05-Quantile-Accuracy": 98.46666717529297, "Augmented-0.1-Quantile-Accuracy": 98.73332977294922, "Augmented-Accuracy": 99.19466666666666, "Augmented-Loss": 0.07957693046967189, "Clean-Accuracy": 99.3, "Clean-Loss": 0.05839371878902117, "PGD-Accuracy": 3.25, "PGD-Loss": 5.893345369974772}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 43, "Epoch-Time": 230.9026746749878, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.39999389648438, "Augmented-0.05-Quantile-Accuracy": 98.18999481201172, "Augmented-0.1-Quantile-Accuracy": 98.5, "Augmented-Accuracy": 99.0529, "Augmented-Loss": 0.08489711442303657, "Clean-Accuracy": 99.08, "Clean-Loss": 0.06263948456048965, "PGD-Accuracy": 2.52, "PGD-Loss": 6.080163342285156}, "Total-Time": 10205.42996764183, "Train": {"Loss": 0.9381162050211871, "avg t": 0.9220386444550973, "plain loss": 0.10852116943995166, "standard loss": 0.07757754825441926}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.53333282470703, "Augmented-0.05-Quantile-Accuracy": 98.31666564941406, "Augmented-0.1-Quantile-Accuracy": 98.51666259765625, "Augmented-Accuracy": 99.1165, "Augmented-Loss": 0.08027810430824757, "Clean-Accuracy": 99.16666666666667, "Clean-Loss": 0.060511012415091193, "PGD-Accuracy": 2.9833333333333334, "PGD-Loss": 6.027102798461914}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 44, "Epoch-Time": 242.32775235176086, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.63999938964844, "Augmented-0.05-Quantile-Accuracy": 98.32999420166016, "Augmented-0.1-Quantile-Accuracy": 98.56999969482422, "Augmented-Accuracy": 99.166, "Augmented-Loss": 0.07517352615165711, "Clean-Accuracy": 99.29, "Clean-Loss": 0.05576320761442184, "PGD-Accuracy": 2.2, "PGD-Loss": 5.938301513671875}, "Total-Time": 10447.757719993591, "Train": {"Loss": 0.938094041329843, "avg t": 0.9220375354201705, "plain loss": 0.10668304458370903, "standard loss": 0.075490223939772}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.96666717529297, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.66666412353516, "Augmented-Accuracy": 99.151, "Augmented-Loss": 0.07138142134884994, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.0542163514594237, "PGD-Accuracy": 2.7, "PGD-Loss": 5.8440249811808265}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 45, "Epoch-Time": 241.83898878097534, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.56999969482422, "Augmented-0.05-Quantile-Accuracy": 98.27999877929688, "Augmented-0.1-Quantile-Accuracy": 98.56999969482422, "Augmented-Accuracy": 99.105, "Augmented-Loss": 0.07769990426635742, "Clean-Accuracy": 99.23, "Clean-Loss": 0.0564679855465889, "PGD-Accuracy": 2.55, "PGD-Loss": 5.835083859252929}, "Total-Time": 10689.596708774567, "Train": {"Loss": 0.9381465911865234, "avg t": 0.9220391178131103, "plain loss": 0.10691222011601488, "standard loss": 0.07535253178852576}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.75, "Augmented-0.05-Quantile-Accuracy": 98.43333435058594, "Augmented-0.1-Quantile-Accuracy": 98.61666870117188, "Augmented-Accuracy": 99.077, "Augmented-Loss": 0.07405280423382918, "Clean-Accuracy": 99.15, "Clean-Loss": 0.05524068925778071, "PGD-Accuracy": 3.033333333333333, "PGD-Loss": 5.734828643798828}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 46, "Epoch-Time": 242.03078269958496, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.64999389648438, "Augmented-0.05-Quantile-Accuracy": 98.3699951171875, "Augmented-0.1-Quantile-Accuracy": 98.5199966430664, "Augmented-Accuracy": 99.1151, "Augmented-Loss": 0.08604954752063751, "Clean-Accuracy": 99.21, "Clean-Loss": 0.061954402458667755, "PGD-Accuracy": 2.32, "PGD-Loss": 5.85872350769043}, "Total-Time": 10931.627491474152, "Train": {"Loss": 0.938133374814634, "avg t": 0.9220382867036042, "plain loss": 0.10912754409578099, "standard loss": 0.07606688529142627}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.04999542236328, "Augmented-0.05-Quantile-Accuracy": 98.53333282470703, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.14966666666666, "Augmented-Loss": 0.07995100480159124, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.05873498477538427, "PGD-Accuracy": 2.5, "PGD-Loss": 5.746773513793945}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 47, "Epoch-Time": 206.65810632705688, "Test": {"Augmented-0.01-Quantile-Accuracy": 96.80999755859375, "Augmented-0.05-Quantile-Accuracy": 97.88999938964844, "Augmented-0.1-Quantile-Accuracy": 98.29999542236328, "Augmented-Accuracy": 98.8351, "Augmented-Loss": 0.08729423835086822, "Clean-Accuracy": 98.89, "Clean-Loss": 0.06474441738128663, "PGD-Accuracy": 2.13, "PGD-Loss": 6.088299295043945}, "Total-Time": 11138.285597801208, "Train": {"Loss": 0.9381343348467791, "avg t": 0.9220311111167625, "plain loss": 0.11195776980011551, "standard loss": 0.0790763172728044}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.18333435058594, "Augmented-0.05-Quantile-Accuracy": 97.8499984741211, "Augmented-0.1-Quantile-Accuracy": 98.1500015258789, "Augmented-Accuracy": 98.807, "Augmented-Loss": 0.08350754958232244, "Clean-Accuracy": 98.91666666666667, "Clean-Loss": 0.06317624477545421, "PGD-Accuracy": 2.3666666666666667, "PGD-Loss": 5.994016822814942}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 48, "Epoch-Time": 219.56668496131897, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.83999633789062, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.65999603271484, "Augmented-Accuracy": 99.1672, "Augmented-Loss": 0.0716670512419939, "Clean-Accuracy": 99.27, "Clean-Loss": 0.05205397779941559, "PGD-Accuracy": 1.98, "PGD-Loss": 6.169540960693359}, "Total-Time": 11357.852282762527, "Train": {"Loss": 0.9380558950636122, "avg t": 0.9220210325453017, "plain loss": 0.10585351344920964, "standard loss": 0.07429418822460704}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.88333129882812, "Augmented-0.05-Quantile-Accuracy": 98.43333435058594, "Augmented-0.1-Quantile-Accuracy": 98.68333435058594, "Augmented-Accuracy": 99.13866666666667, "Augmented-Loss": 0.06871929032842318, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.051413089702526726, "PGD-Accuracy": 2.15, "PGD-Loss": 6.0687893168131515}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 49, "Epoch-Time": 242.18103766441345, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.70999908447266, "Augmented-0.05-Quantile-Accuracy": 98.41999816894531, "Augmented-0.1-Quantile-Accuracy": 98.54999542236328, "Augmented-Accuracy": 99.0779, "Augmented-Loss": 0.07407081060039997, "Clean-Accuracy": 99.18, "Clean-Loss": 0.054716119170188905, "PGD-Accuracy": 2.5, "PGD-Loss": 5.99733362121582}, "Total-Time": 11600.033320426941, "Train": {"Loss": 0.9380493353561119, "avg t": 0.922027244426586, "plain loss": 0.10824194121184168, "standard loss": 0.07592407550635161}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.83333587646484, "Augmented-0.05-Quantile-Accuracy": 98.41666412353516, "Augmented-0.1-Quantile-Accuracy": 98.66666412353516, "Augmented-Accuracy": 99.14333333333333, "Augmented-Loss": 0.0699944743047158, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.05326801538467407, "PGD-Accuracy": 2.6333333333333333, "PGD-Loss": 5.973612101236979}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 50, "Epoch-Time": 242.33608961105347, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.48999786376953, "Augmented-0.05-Quantile-Accuracy": 98.25, "Augmented-0.1-Quantile-Accuracy": 98.44999694824219, "Augmented-Accuracy": 99.0176, "Augmented-Loss": 0.08688439219689369, "Clean-Accuracy": 99.07, "Clean-Loss": 0.06331583262681961, "PGD-Accuracy": 2.74, "PGD-Loss": 5.715276098632812}, "Total-Time": 11842.369410037994, "Train": {"Loss": 0.938212475405799, "avg t": 0.922051173598678, "plain loss": 0.11075200102064332, "standard loss": 0.07886547912712451}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.83333587646484, "Augmented-0.05-Quantile-Accuracy": 98.43333435058594, "Augmented-0.1-Quantile-Accuracy": 98.71666717529297, "Augmented-Accuracy": 99.11383333333333, "Augmented-Loss": 0.08032935724794865, "Clean-Accuracy": 99.1, "Clean-Loss": 0.059397326946258544, "PGD-Accuracy": 3.1666666666666665, "PGD-Loss": 5.66270166015625}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 51, "Epoch-Time": 242.18734979629517, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.29999542236328, "Augmented-0.05-Quantile-Accuracy": 98.06999969482422, "Augmented-0.1-Quantile-Accuracy": 98.31999969482422, "Augmented-Accuracy": 98.994, "Augmented-Loss": 0.08310516870069504, "Clean-Accuracy": 99.13, "Clean-Loss": 0.0618151417016983, "PGD-Accuracy": 2.97, "PGD-Loss": 5.757387982177734}, "Total-Time": 12084.55675983429, "Train": {"Loss": 0.9380838830382736, "avg t": 0.9220384404924181, "plain loss": 0.10830608029718759, "standard loss": 0.07770983370807436}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.83333587646484, "Augmented-0.05-Quantile-Accuracy": 98.31666564941406, "Augmented-0.1-Quantile-Accuracy": 98.54999542236328, "Augmented-Accuracy": 99.05483333333333, "Augmented-Loss": 0.07710259734928608, "Clean-Accuracy": 99.16666666666667, "Clean-Loss": 0.05808505515257518, "PGD-Accuracy": 3.283333333333333, "PGD-Loss": 5.67355633799235}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 52, "Epoch-Time": 234.3525950908661, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.79000091552734, "Augmented-0.05-Quantile-Accuracy": 98.32999420166016, "Augmented-0.1-Quantile-Accuracy": 98.62999725341797, "Augmented-Accuracy": 99.1583, "Augmented-Loss": 0.08603136776709557, "Clean-Accuracy": 99.29, "Clean-Loss": 0.06376683830022811, "PGD-Accuracy": 2.27, "PGD-Loss": 6.113480023193359}, "Total-Time": 12318.909354925156, "Train": {"Loss": 0.9381419106942636, "avg t": 0.922034072805334, "plain loss": 0.10787025684074127, "standard loss": 0.07742864108968664}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.01666259765625, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.16616666666667, "Augmented-Loss": 0.08080773383577665, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.060737233638763426, "PGD-Accuracy": 2.7, "PGD-Loss": 6.045969792683919}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 53, "Epoch-Time": 203.21707940101624, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.82999420166016, "Augmented-0.05-Quantile-Accuracy": 98.41999816894531, "Augmented-0.1-Quantile-Accuracy": 98.5999984741211, "Augmented-Accuracy": 99.176, "Augmented-Loss": 0.08467424268722534, "Clean-Accuracy": 99.3, "Clean-Loss": 0.061547512781620024, "PGD-Accuracy": 2.13, "PGD-Loss": 5.963144482421875}, "Total-Time": 12522.126434326172, "Train": {"Loss": 0.938179229400776, "avg t": 0.9220364666691533, "plain loss": 0.10885273152633959, "standard loss": 0.07749788796460187}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.18333435058594, "Augmented-0.05-Quantile-Accuracy": 98.6500015258789, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.1565, "Augmented-Loss": 0.0795834893021981, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.05892846538623174, "PGD-Accuracy": 1.9833333333333334, "PGD-Loss": 5.90671012878418}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 54, "Epoch-Time": 232.87954998016357, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.57999420166016, "Augmented-0.05-Quantile-Accuracy": 98.31999969482422, "Augmented-0.1-Quantile-Accuracy": 98.57999420166016, "Augmented-Accuracy": 99.104, "Augmented-Loss": 0.07431097469568253, "Clean-Accuracy": 99.21, "Clean-Loss": 0.0542464035987854, "PGD-Accuracy": 2.48, "PGD-Loss": 5.695219812011719}, "Total-Time": 12755.005984306335, "Train": {"Loss": 0.9380537176485415, "avg t": 0.9220294344160291, "plain loss": 0.10847986392974854, "standard loss": 0.0770106828444534}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.98332977294922, "Augmented-0.05-Quantile-Accuracy": 98.44999694824219, "Augmented-0.1-Quantile-Accuracy": 98.61666870117188, "Augmented-Accuracy": 99.08216666666667, "Augmented-Loss": 0.0695232938716809, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.051874942710002266, "PGD-Accuracy": 2.8833333333333333, "PGD-Loss": 5.596383819580078}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 55, "Epoch-Time": 242.0136604309082, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.62999725341797, "Augmented-0.05-Quantile-Accuracy": 98.33999633789062, "Augmented-0.1-Quantile-Accuracy": 98.62999725341797, "Augmented-Accuracy": 99.1428, "Augmented-Loss": 0.07470401794934273, "Clean-Accuracy": 99.21, "Clean-Loss": 0.05509545518159866, "PGD-Accuracy": 2.01, "PGD-Loss": 5.84776005859375}, "Total-Time": 12997.019644737244, "Train": {"Loss": 0.938157626328645, "avg t": 0.9220360118018256, "plain loss": 0.10764830795923873, "standard loss": 0.07612449099399425}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.94999694824219, "Augmented-0.05-Quantile-Accuracy": 98.44999694824219, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.15733333333333, "Augmented-Loss": 0.06933052030324936, "Clean-Accuracy": 99.25, "Clean-Loss": 0.05234435352683067, "PGD-Accuracy": 2.7333333333333334, "PGD-Loss": 5.7570926971435545}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 56, "Epoch-Time": 242.0531656742096, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.75999450683594, "Augmented-0.05-Quantile-Accuracy": 98.41999816894531, "Augmented-0.1-Quantile-Accuracy": 98.70999908447266, "Augmented-Accuracy": 99.1661, "Augmented-Loss": 0.07054395355057716, "Clean-Accuracy": 99.24, "Clean-Loss": 0.052387886416912076, "PGD-Accuracy": 2.11, "PGD-Loss": 6.133909402465821}, "Total-Time": 13239.072810411453, "Train": {"Loss": 0.9380537406780102, "avg t": 0.9220236365706832, "plain loss": 0.10577302693967465, "standard loss": 0.07545189875805819}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0999984741211, "Augmented-0.05-Quantile-Accuracy": 98.48332977294922, "Augmented-0.1-Quantile-Accuracy": 98.66666412353516, "Augmented-Accuracy": 99.154, "Augmented-Loss": 0.06711865066369374, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.05117560716470083, "PGD-Accuracy": 2.433333333333333, "PGD-Loss": 6.03451725769043}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 57, "Epoch-Time": 242.11485719680786, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.72999572753906, "Augmented-0.05-Quantile-Accuracy": 98.32999420166016, "Augmented-0.1-Quantile-Accuracy": 98.65999603271484, "Augmented-Accuracy": 99.1201, "Augmented-Loss": 0.07640019810962677, "Clean-Accuracy": 99.22, "Clean-Loss": 0.05781826858520508, "PGD-Accuracy": 2.52, "PGD-Loss": 5.728606210327149}, "Total-Time": 13481.187667608261, "Train": {"Loss": 0.9381214774096454, "avg t": 0.9220261053155969, "plain loss": 0.1086710911150331, "standard loss": 0.07741698755158319}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.01666259765625, "Augmented-0.05-Quantile-Accuracy": 98.53333282470703, "Augmented-0.1-Quantile-Accuracy": 98.66666412353516, "Augmented-Accuracy": 99.16616666666667, "Augmented-Loss": 0.07115010763367018, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.05451528285940488, "PGD-Accuracy": 2.683333333333333, "PGD-Loss": 5.627766746520996}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 58, "Epoch-Time": 206.01890635490417, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.50999450683594, "Augmented-0.05-Quantile-Accuracy": 98.29000091552734, "Augmented-0.1-Quantile-Accuracy": 98.5, "Augmented-Accuracy": 99.1105, "Augmented-Loss": 0.08595383532691002, "Clean-Accuracy": 99.23, "Clean-Loss": 0.06404784543514251, "PGD-Accuracy": 3.29, "PGD-Loss": 5.544883950805664}, "Total-Time": 13687.206573963165, "Train": {"Loss": 0.9380753513795358, "avg t": 0.9220229031951339, "plain loss": 0.10712414728447228, "standard loss": 0.07790194036783996}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.86666870117188, "Augmented-0.05-Quantile-Accuracy": 98.41666412353516, "Augmented-0.1-Quantile-Accuracy": 98.63333129882812, "Augmented-Accuracy": 99.08933333333333, "Augmented-Loss": 0.08012176442245643, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.060231136778990425, "PGD-Accuracy": 3.75, "PGD-Loss": 5.482391001383464}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 59, "Epoch-Time": 219.53961038589478, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.86000061035156, "Augmented-0.05-Quantile-Accuracy": 98.47999572753906, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.1564, "Augmented-Loss": 0.07948180088829994, "Clean-Accuracy": 99.27, "Clean-Loss": 0.05940169467926026, "PGD-Accuracy": 2.77, "PGD-Loss": 5.502135775756836}, "Total-Time": 13906.74618434906, "Train": {"Loss": 0.9380542567394398, "avg t": 0.9220148796152186, "plain loss": 0.10764903599774392, "standard loss": 0.07884979506333668}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.08333587646484, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.17166666666667, "Augmented-Loss": 0.07466540256361166, "Clean-Accuracy": 99.25, "Clean-Loss": 0.05679090855518977, "PGD-Accuracy": 3.2666666666666666, "PGD-Loss": 5.450955032348633}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 60, "Epoch-Time": 242.2149612903595, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.79000091552734, "Augmented-0.05-Quantile-Accuracy": 98.38999938964844, "Augmented-0.1-Quantile-Accuracy": 98.65999603271484, "Augmented-Accuracy": 99.1794, "Augmented-Loss": 0.07231288900065422, "Clean-Accuracy": 99.27, "Clean-Loss": 0.05353014522790909, "PGD-Accuracy": 2.34, "PGD-Loss": 5.773220504760742}, "Total-Time": 14148.96114563942, "Train": {"Loss": 0.9380892426879318, "avg t": 0.9220212922272859, "plain loss": 0.10562085591245597, "standard loss": 0.07673738016022576}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.11666870117188, "Augmented-0.05-Quantile-Accuracy": 98.6500015258789, "Augmented-0.1-Quantile-Accuracy": 98.83333587646484, "Augmented-Accuracy": 99.19766666666666, "Augmented-Loss": 0.06734395215988159, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.05097510149081548, "PGD-Accuracy": 2.8833333333333333, "PGD-Loss": 5.680521041870117}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 61, "Epoch-Time": 241.908136844635, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.6199951171875, "Augmented-0.05-Quantile-Accuracy": 98.47000122070312, "Augmented-0.1-Quantile-Accuracy": 98.64999389648438, "Augmented-Accuracy": 99.1503, "Augmented-Loss": 0.07804544557857514, "Clean-Accuracy": 99.22, "Clean-Loss": 0.059005414056777956, "PGD-Accuracy": 2.9, "PGD-Loss": 5.70777135925293}, "Total-Time": 14390.869282484055, "Train": {"Loss": 0.9380902078593218, "avg t": 0.9220211962947139, "plain loss": 0.10667698599144261, "standard loss": 0.07883398429552714}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.96666717529297, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.16566666666667, "Augmented-Loss": 0.07350730296214422, "Clean-Accuracy": 99.25, "Clean-Loss": 0.05611877878506978, "PGD-Accuracy": 3.05, "PGD-Loss": 5.634968363444011}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 62, "Epoch-Time": 241.99533224105835, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.63999938964844, "Augmented-0.05-Quantile-Accuracy": 98.31999969482422, "Augmented-0.1-Quantile-Accuracy": 98.64999389648438, "Augmented-Accuracy": 99.1132, "Augmented-Loss": 0.08000462195086479, "Clean-Accuracy": 99.17, "Clean-Loss": 0.05981316686868668, "PGD-Accuracy": 1.84, "PGD-Loss": 5.982817324829101}, "Total-Time": 14632.864614725113, "Train": {"Loss": 0.9380463522451895, "avg t": 0.9220088794849537, "plain loss": 0.10482030755678813, "standard loss": 0.0757176070301621}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.01666259765625, "Augmented-0.05-Quantile-Accuracy": 98.46666717529297, "Augmented-0.1-Quantile-Accuracy": 98.66666412353516, "Augmented-Accuracy": 99.123, "Augmented-Loss": 0.0759912410924832, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.057815795282522835, "PGD-Accuracy": 2.25, "PGD-Loss": 5.8773329722086585}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 63, "Epoch-Time": 231.10413885116577, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.73999786376953, "Augmented-0.05-Quantile-Accuracy": 98.48999786376953, "Augmented-0.1-Quantile-Accuracy": 98.65999603271484, "Augmented-Accuracy": 99.1654, "Augmented-Loss": 0.07582856389689445, "Clean-Accuracy": 99.2, "Clean-Loss": 0.056334062325954434, "PGD-Accuracy": 1.79, "PGD-Loss": 5.934575003051758}, "Total-Time": 14863.968753576279, "Train": {"Loss": 0.9380968763210156, "avg t": 0.9220283249042652, "plain loss": 0.10612963563777797, "standard loss": 0.07747624621788661}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.21666717529297, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.12916666666666, "Augmented-Loss": 0.07237863612294197, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.0550589984357357, "PGD-Accuracy": 2.1166666666666667, "PGD-Loss": 5.878166803995768}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 64, "Epoch-Time": 204.86743545532227, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.77999877929688, "Augmented-0.05-Quantile-Accuracy": 98.47999572753906, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.1885, "Augmented-Loss": 0.08045500321722031, "Clean-Accuracy": 99.33, "Clean-Loss": 0.05991073219776154, "PGD-Accuracy": 2.34, "PGD-Loss": 5.686590414428711}, "Total-Time": 15068.836189031601, "Train": {"Loss": 0.9380368852262144, "avg t": 0.9220134812284398, "plain loss": 0.1052476117663912, "standard loss": 0.0762304651538531}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0999984741211, "Augmented-0.05-Quantile-Accuracy": 98.63333129882812, "Augmented-0.1-Quantile-Accuracy": 98.73332977294922, "Augmented-Accuracy": 99.19016666666667, "Augmented-Loss": 0.07658402775088946, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.05788907840847969, "PGD-Accuracy": 2.6166666666666667, "PGD-Loss": 5.620158864339193}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 65, "Epoch-Time": 234.80818009376526, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.77999877929688, "Augmented-0.05-Quantile-Accuracy": 98.45999908447266, "Augmented-0.1-Quantile-Accuracy": 98.63999938964844, "Augmented-Accuracy": 99.1679, "Augmented-Loss": 0.07237885810899734, "Clean-Accuracy": 99.24, "Clean-Loss": 0.05445621120929718, "PGD-Accuracy": 1.67, "PGD-Loss": 6.192089440917969}, "Total-Time": 15303.644369125366, "Train": {"Loss": 0.9380197511955544, "avg t": 0.9220083774990505, "plain loss": 0.10509048664481546, "standard loss": 0.07694250049855975}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.03333282470703, "Augmented-0.05-Quantile-Accuracy": 98.56666564941406, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.22816666666667, "Augmented-Loss": 0.06807086129883926, "Clean-Accuracy": 99.35, "Clean-Loss": 0.05216665610671043, "PGD-Accuracy": 1.85, "PGD-Loss": 6.152626622517904}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 66, "Epoch-Time": 241.970317363739, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.79000091552734, "Augmented-0.05-Quantile-Accuracy": 98.41999816894531, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.1476, "Augmented-Loss": 0.07425594858503341, "Clean-Accuracy": 99.22, "Clean-Loss": 0.055814444363117215, "PGD-Accuracy": 1.81, "PGD-Loss": 6.263928021240234}, "Total-Time": 15545.614686489105, "Train": {"Loss": 0.9380130047268338, "avg t": 0.9220057351854113, "plain loss": 0.10269038927996602, "standard loss": 0.07446420908195}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0, "Augmented-0.05-Quantile-Accuracy": 98.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.1485, "Augmented-Loss": 0.07034472047448158, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.05382641174395879, "PGD-Accuracy": 2.216666666666667, "PGD-Loss": 6.194184611002604}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 67, "Epoch-Time": 242.21249389648438, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.73999786376953, "Augmented-0.05-Quantile-Accuracy": 98.47000122070312, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.192, "Augmented-Loss": 0.0717143346323967, "Clean-Accuracy": 99.32, "Clean-Loss": 0.052157280337810516, "PGD-Accuracy": 2.16, "PGD-Loss": 5.825733926391601}, "Total-Time": 15787.82718038559, "Train": {"Loss": 0.9380355252866391, "avg t": 0.922007201247745, "plain loss": 0.10073883102205075, "standard loss": 0.07162141243395982}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.11666870117188, "Augmented-0.05-Quantile-Accuracy": 98.68333435058594, "Augmented-0.1-Quantile-Accuracy": 98.83333587646484, "Augmented-Accuracy": 99.20633333333333, "Augmented-Loss": 0.06786928828756014, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.050583859890699384, "PGD-Accuracy": 2.25, "PGD-Loss": 5.764242268880208}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 68, "Epoch-Time": 241.6483359336853, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.75, "Augmented-0.05-Quantile-Accuracy": 98.3499984741211, "Augmented-0.1-Quantile-Accuracy": 98.65999603271484, "Augmented-Accuracy": 99.128, "Augmented-Loss": 0.07154291464805602, "Clean-Accuracy": 99.24, "Clean-Loss": 0.05294717907905579, "PGD-Accuracy": 1.72, "PGD-Loss": 5.985500088500976}, "Total-Time": 16029.475516319275, "Train": {"Loss": 0.9380732246328283, "avg t": 0.9220188319947984, "plain loss": 0.10452607087735775, "standard loss": 0.07381875488934693}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.98332977294922, "Augmented-0.05-Quantile-Accuracy": 98.53333282470703, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.15866666666666, "Augmented-Loss": 0.06773961054285367, "Clean-Accuracy": 99.16666666666667, "Clean-Loss": 0.051193068852027256, "PGD-Accuracy": 2.2, "PGD-Loss": 5.9153977915445966}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 69, "Epoch-Time": 206.83568692207336, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.82999420166016, "Augmented-0.05-Quantile-Accuracy": 98.44999694824219, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.2055, "Augmented-Loss": 0.06538210255730152, "Clean-Accuracy": 99.3, "Clean-Loss": 0.048779823863506315, "PGD-Accuracy": 1.8, "PGD-Loss": 5.921339749145508}, "Total-Time": 16236.311203241348, "Train": {"Loss": 0.9379685817294651, "avg t": 0.9220021353297764, "plain loss": 0.10099734475171133, "standard loss": 0.0726673222956834}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.01666259765625, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.16383333333333, "Augmented-Loss": 0.062098505521516, "Clean-Accuracy": 99.25, "Clean-Loss": 0.04747703908880552, "PGD-Accuracy": 2.3666666666666667, "PGD-Loss": 5.885509264628093}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 70, "Epoch-Time": 219.5079050064087, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.72999572753906, "Augmented-0.05-Quantile-Accuracy": 98.40999603271484, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.1783, "Augmented-Loss": 0.07597835874342919, "Clean-Accuracy": 99.32, "Clean-Loss": 0.05517984935045242, "PGD-Accuracy": 1.45, "PGD-Loss": 5.924876068115235}, "Total-Time": 16455.819108247757, "Train": {"Loss": 0.9380739655671296, "avg t": 0.9220125051427771, "plain loss": 0.10202144797996235, "standard loss": 0.07224562678513703}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.06666564941406, "Augmented-0.05-Quantile-Accuracy": 98.53333282470703, "Augmented-0.1-Quantile-Accuracy": 98.71666717529297, "Augmented-Accuracy": 99.16166666666666, "Augmented-Loss": 0.07140399189472199, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.05298882055282593, "PGD-Accuracy": 1.9333333333333333, "PGD-Loss": 5.8031846720377604}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 71, "Epoch-Time": 241.95721435546875, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.72999572753906, "Augmented-0.05-Quantile-Accuracy": 98.45999908447266, "Augmented-0.1-Quantile-Accuracy": 98.64999389648438, "Augmented-Accuracy": 99.1576, "Augmented-Loss": 0.0738730021109581, "Clean-Accuracy": 99.21, "Clean-Loss": 0.05408690938949585, "PGD-Accuracy": 1.94, "PGD-Loss": 5.788445626831055}, "Total-Time": 16697.776322603226, "Train": {"Loss": 0.9380299532854999, "avg t": 0.9220172325416848, "plain loss": 0.10168953075408936, "standard loss": 0.07133475009158806}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.96666717529297, "Augmented-0.05-Quantile-Accuracy": 98.51666259765625, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.1385, "Augmented-Loss": 0.06930902039011319, "Clean-Accuracy": 99.2, "Clean-Loss": 0.05183979667226474, "PGD-Accuracy": 2.183333333333333, "PGD-Loss": 5.743802434285482}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 72, "Epoch-Time": 242.03191542625427, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.93000030517578, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.72999572753906, "Augmented-Accuracy": 99.2132, "Augmented-Loss": 0.07057674496495724, "Clean-Accuracy": 99.3, "Clean-Loss": 0.05000861591100693, "PGD-Accuracy": 1.74, "PGD-Loss": 6.049326574707031}, "Total-Time": 16939.80823802948, "Train": {"Loss": 0.9379728276288067, "avg t": 0.9219974980530915, "plain loss": 0.09820119414152911, "standard loss": 0.06827831955309267}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.08333587646484, "Augmented-0.05-Quantile-Accuracy": 98.61666870117188, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.21283333333334, "Augmented-Loss": 0.06710308675130208, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.04900719484686852, "PGD-Accuracy": 2.05, "PGD-Loss": 5.976139694213868}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 73, "Epoch-Time": 242.3669331073761, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.72999572753906, "Augmented-0.05-Quantile-Accuracy": 98.38999938964844, "Augmented-0.1-Quantile-Accuracy": 98.64999389648438, "Augmented-Accuracy": 99.1436, "Augmented-Loss": 0.08345693076324463, "Clean-Accuracy": 99.27, "Clean-Loss": 0.05990074743032455, "PGD-Accuracy": 2.18, "PGD-Loss": 5.7350202056884765}, "Total-Time": 17182.175171136856, "Train": {"Loss": 0.9380610602696736, "avg t": 0.9220070077048408, "plain loss": 0.10027580505300447, "standard loss": 0.07037102734269919}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.93333435058594, "Augmented-0.05-Quantile-Accuracy": 98.44999694824219, "Augmented-0.1-Quantile-Accuracy": 98.63333129882812, "Augmented-Accuracy": 99.12516666666667, "Augmented-Loss": 0.07932206143359344, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.058325313806533816, "PGD-Accuracy": 2.716666666666667, "PGD-Loss": 5.588826187133789}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 74, "Epoch-Time": 228.11888027191162, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.64999389648438, "Augmented-0.05-Quantile-Accuracy": 98.36000061035156, "Augmented-0.1-Quantile-Accuracy": 98.62999725341797, "Augmented-Accuracy": 99.1494, "Augmented-Loss": 0.0710267547172308, "Clean-Accuracy": 99.25, "Clean-Loss": 0.052715767526626586, "PGD-Accuracy": 2.13, "PGD-Loss": 5.911546008300781}, "Total-Time": 17410.294051408768, "Train": {"Loss": 0.9380197358308016, "avg t": 0.9220112326586688, "plain loss": 0.10429760756139408, "standard loss": 0.07317589803371165}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.08333587646484, "Augmented-0.05-Quantile-Accuracy": 98.54999542236328, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.12283333333333, "Augmented-Loss": 0.06675688048879305, "Clean-Accuracy": 99.2, "Clean-Loss": 0.05066060923536619, "PGD-Accuracy": 2.7333333333333334, "PGD-Loss": 5.814233210245768}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 75, "Epoch-Time": 208.13200545310974, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.73999786376953, "Augmented-0.05-Quantile-Accuracy": 98.37999725341797, "Augmented-0.1-Quantile-Accuracy": 98.63999938964844, "Augmented-Accuracy": 99.1492, "Augmented-Loss": 0.08368602147388458, "Clean-Accuracy": 99.23, "Clean-Loss": 0.061256438183784484, "PGD-Accuracy": 2.05, "PGD-Loss": 5.908936923217773}, "Total-Time": 17618.426056861877, "Train": {"Loss": 0.9379945942914044, "avg t": 0.9219989841779073, "plain loss": 0.10137367414545133, "standard loss": 0.07272652721515409}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0, "Augmented-0.05-Quantile-Accuracy": 98.46666717529297, "Augmented-0.1-Quantile-Accuracy": 98.73332977294922, "Augmented-Accuracy": 99.11766666666666, "Augmented-Loss": 0.07916870343029499, "Clean-Accuracy": 99.2, "Clean-Loss": 0.058910116235415144, "PGD-Accuracy": 2.3666666666666667, "PGD-Loss": 5.874539204915364}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 76, "Epoch-Time": 237.78136277198792, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.68000030517578, "Augmented-0.05-Quantile-Accuracy": 98.29000091552734, "Augmented-0.1-Quantile-Accuracy": 98.43999481201172, "Augmented-Accuracy": 99.0908, "Augmented-Loss": 0.07105571188151837, "Clean-Accuracy": 99.26, "Clean-Loss": 0.05237115191221237, "PGD-Accuracy": 1.1, "PGD-Loss": 6.621282968139648}, "Total-Time": 17856.207419633865, "Train": {"Loss": 0.9379670285825377, "avg t": 0.9219978841145834, "plain loss": 0.10044828709849607, "standard loss": 0.07251014929568327}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.91666412353516, "Augmented-0.05-Quantile-Accuracy": 98.44999694824219, "Augmented-0.1-Quantile-Accuracy": 98.6500015258789, "Augmented-Accuracy": 99.06066666666666, "Augmented-Loss": 0.0687588090266784, "Clean-Accuracy": 99.13333333333334, "Clean-Loss": 0.052048264652490614, "PGD-Accuracy": 1.4333333333333333, "PGD-Loss": 6.473658650716146}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 77, "Epoch-Time": 241.91666650772095, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.40999603271484, "Augmented-0.05-Quantile-Accuracy": 98.18999481201172, "Augmented-0.1-Quantile-Accuracy": 98.5, "Augmented-Accuracy": 99.0328, "Augmented-Loss": 0.07662731020045281, "Clean-Accuracy": 99.14, "Clean-Loss": 0.05797756768465042, "PGD-Accuracy": 1.61, "PGD-Loss": 6.088661019897461}, "Total-Time": 18098.124086141586, "Train": {"Loss": 0.9380022857807301, "avg t": 0.9220004777908325, "plain loss": 0.10189612590648507, "standard loss": 0.07380733662181431}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.73332977294922, "Augmented-0.05-Quantile-Accuracy": 98.33333587646484, "Augmented-0.1-Quantile-Accuracy": 98.58333587646484, "Augmented-Accuracy": 99.07383333333334, "Augmented-Loss": 0.07205609867135683, "Clean-Accuracy": 99.11666666666666, "Clean-Loss": 0.055444002876679103, "PGD-Accuracy": 2.2, "PGD-Loss": 5.978564463297526}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 78, "Epoch-Time": 242.01240253448486, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.62999725341797, "Augmented-0.05-Quantile-Accuracy": 98.30999755859375, "Augmented-0.1-Quantile-Accuracy": 98.58999633789062, "Augmented-Accuracy": 99.1109, "Augmented-Loss": 0.06717545925784112, "Clean-Accuracy": 99.19, "Clean-Loss": 0.05180957826375961, "PGD-Accuracy": 1.99, "PGD-Loss": 6.163081060791016}, "Total-Time": 18340.13648867607, "Train": {"Loss": 0.937988532172309, "avg t": 0.921996900010992, "plain loss": 0.10438151460930155, "standard loss": 0.07662013335581179}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0, "Augmented-0.05-Quantile-Accuracy": 98.51666259765625, "Augmented-0.1-Quantile-Accuracy": 98.6500015258789, "Augmented-Accuracy": 99.13983333333333, "Augmented-Loss": 0.06335285048186778, "Clean-Accuracy": 99.25, "Clean-Loss": 0.049895434925953545, "PGD-Accuracy": 2.45, "PGD-Loss": 6.082433369954427}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 79, "Epoch-Time": 242.10709071159363, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.87999725341797, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.70999908447266, "Augmented-Accuracy": 99.2082, "Augmented-Loss": 0.07344479669427871, "Clean-Accuracy": 99.3, "Clean-Loss": 0.05495066919326782, "PGD-Accuracy": 1.59, "PGD-Loss": 5.927372894287109}, "Total-Time": 18582.243579387665, "Train": {"Loss": 0.937985023993033, "avg t": 0.9219980961128518, "plain loss": 0.09850455257451092, "standard loss": 0.07222675774384428}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.23332977294922, "Augmented-0.05-Quantile-Accuracy": 98.6500015258789, "Augmented-0.1-Quantile-Accuracy": 98.8499984741211, "Augmented-Accuracy": 99.228, "Augmented-Loss": 0.06955543163955212, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.052872043470541634, "PGD-Accuracy": 2.1333333333333333, "PGD-Loss": 5.863641042073568}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 80, "Epoch-Time": 205.64589715003967, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.75999450683594, "Augmented-0.05-Quantile-Accuracy": 98.43999481201172, "Augmented-0.1-Quantile-Accuracy": 98.63999938964844, "Augmented-Accuracy": 99.1493, "Augmented-Loss": 0.0768379846739769, "Clean-Accuracy": 99.24, "Clean-Loss": 0.058166974890232086, "PGD-Accuracy": 1.94, "PGD-Loss": 5.670695516967774}, "Total-Time": 18787.889476537704, "Train": {"Loss": 0.9379717110704493, "avg t": 0.9219957909054226, "plain loss": 0.10178636344627097, "standard loss": 0.07480663368437025}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.9000015258789, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.63333129882812, "Augmented-Accuracy": 99.122, "Augmented-Loss": 0.07376577421883743, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.05706304066379865, "PGD-Accuracy": 2.466666666666667, "PGD-Loss": 5.607523854573568}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 81, "Epoch-Time": 220.14442682266235, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.48999786376953, "Augmented-0.05-Quantile-Accuracy": 98.31999969482422, "Augmented-0.1-Quantile-Accuracy": 98.5199966430664, "Augmented-Accuracy": 99.0971, "Augmented-Loss": 0.08873303084135055, "Clean-Accuracy": 99.21, "Clean-Loss": 0.06619562708139419, "PGD-Accuracy": 2.3, "PGD-Loss": 5.714747253417968}, "Total-Time": 19008.033903360367, "Train": {"Loss": 0.9379725072825397, "avg t": 0.9219908048841688, "plain loss": 0.10070740286862408, "standard loss": 0.07340112429636496}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.68333435058594, "Augmented-0.05-Quantile-Accuracy": 98.33333587646484, "Augmented-0.1-Quantile-Accuracy": 98.58333587646484, "Augmented-Accuracy": 99.06666666666666, "Augmented-Loss": 0.08350114239255588, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.0632643775343895, "PGD-Accuracy": 2.85, "PGD-Loss": 5.610921432495117}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 82, "Epoch-Time": 242.2017843723297, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.58999633789062, "Augmented-0.05-Quantile-Accuracy": 98.25, "Augmented-0.1-Quantile-Accuracy": 98.43999481201172, "Augmented-Accuracy": 99.0048, "Augmented-Loss": 0.07540912380480766, "Clean-Accuracy": 99.1, "Clean-Loss": 0.05641146725416184, "PGD-Accuracy": 2.31, "PGD-Loss": 6.032060336303711}, "Total-Time": 19250.235687732697, "Train": {"Loss": 0.9379715323448181, "avg t": 0.9219911904511628, "plain loss": 0.09790050694147749, "standard loss": 0.07216609466958929}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.81666564941406, "Augmented-0.05-Quantile-Accuracy": 98.46666717529297, "Augmented-0.1-Quantile-Accuracy": 98.58333587646484, "Augmented-Accuracy": 99.05983333333333, "Augmented-Loss": 0.07179856240491073, "Clean-Accuracy": 99.05, "Clean-Loss": 0.054952100306749345, "PGD-Accuracy": 2.45, "PGD-Loss": 5.970335606892903}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 83, "Epoch-Time": 241.9910593032837, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.47999572753906, "Augmented-0.05-Quantile-Accuracy": 98.20999908447266, "Augmented-0.1-Quantile-Accuracy": 98.5, "Augmented-Accuracy": 99.0284, "Augmented-Loss": 0.07910179743075371, "Clean-Accuracy": 99.11, "Clean-Loss": 0.059375703704357144, "PGD-Accuracy": 1.6, "PGD-Loss": 6.0502975402832035}, "Total-Time": 19492.22674703598, "Train": {"Loss": 0.937941059536404, "avg t": 0.9219882470590097, "plain loss": 0.09728807254720623, "standard loss": 0.0712117990873478}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.76666259765625, "Augmented-0.05-Quantile-Accuracy": 98.28333282470703, "Augmented-0.1-Quantile-Accuracy": 98.58333587646484, "Augmented-Accuracy": 98.97533333333334, "Augmented-Loss": 0.0750891662333409, "Clean-Accuracy": 99.08333333333333, "Clean-Loss": 0.05755811653534571, "PGD-Accuracy": 2.0166666666666666, "PGD-Loss": 5.9049640604654945}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 84, "Epoch-Time": 242.22775030136108, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.65999603271484, "Augmented-0.05-Quantile-Accuracy": 98.37999725341797, "Augmented-0.1-Quantile-Accuracy": 98.6199951171875, "Augmented-Accuracy": 99.1083, "Augmented-Loss": 0.06909019840669632, "Clean-Accuracy": 99.21, "Clean-Loss": 0.05123220281600952, "PGD-Accuracy": 2.59, "PGD-Loss": 5.884867178344726}, "Total-Time": 19734.45449733734, "Train": {"Loss": 0.9379684758362947, "avg t": 0.9219925314055549, "plain loss": 0.09421708094632196, "standard loss": 0.06774071004876384}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.18333435058594, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.16516666666666, "Augmented-Loss": 0.06451641881366571, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.04897243611017863, "PGD-Accuracy": 2.75, "PGD-Loss": 5.807672948201497}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 85, "Epoch-Time": 223.09733867645264, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.87999725341797, "Augmented-0.05-Quantile-Accuracy": 98.44999694824219, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.1747, "Augmented-Loss": 0.0750286757235527, "Clean-Accuracy": 99.24, "Clean-Loss": 0.05517426697015762, "PGD-Accuracy": 1.9, "PGD-Loss": 6.0259592163085935}, "Total-Time": 19957.551836013794, "Train": {"Loss": 0.9379406246962371, "avg t": 0.9219859936325638, "plain loss": 0.09833809599523183, "standard loss": 0.06988172129348472}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.1500015258789, "Augmented-0.05-Quantile-Accuracy": 98.68333435058594, "Augmented-0.1-Quantile-Accuracy": 98.88333129882812, "Augmented-Accuracy": 99.2365, "Augmented-Loss": 0.07067740349590779, "Clean-Accuracy": 99.33333333333333, "Clean-Loss": 0.053087374935547514, "PGD-Accuracy": 2.533333333333333, "PGD-Loss": 5.935210973103841}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 86, "Epoch-Time": 209.17095184326172, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.81999969482422, "Augmented-0.05-Quantile-Accuracy": 98.48999786376953, "Augmented-0.1-Quantile-Accuracy": 98.72000122070312, "Augmented-Accuracy": 99.1657, "Augmented-Loss": 0.07570752266860008, "Clean-Accuracy": 99.29, "Clean-Loss": 0.05552309130430222, "PGD-Accuracy": 2.09, "PGD-Loss": 5.740240051269531}, "Total-Time": 20166.722787857056, "Train": {"Loss": 0.9379418794490673, "avg t": 0.9219907558582447, "plain loss": 0.09796356916780836, "standard loss": 0.06972908780309889}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.01666259765625, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.88333129882812, "Augmented-Accuracy": 99.1995, "Augmented-Loss": 0.07161788113137087, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.05371177213390668, "PGD-Accuracy": 2.6166666666666667, "PGD-Loss": 5.683355590820312}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 87, "Epoch-Time": 239.92212629318237, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.75999450683594, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.73999786376953, "Augmented-Accuracy": 99.1903, "Augmented-Loss": 0.0726487583565712, "Clean-Accuracy": 99.3, "Clean-Loss": 0.05508706916570663, "PGD-Accuracy": 1.96, "PGD-Loss": 6.045773468017578}, "Total-Time": 20406.644914150238, "Train": {"Loss": 0.93790020748421, "avg t": 0.9219825382939092, "plain loss": 0.09857693587232516, "standard loss": 0.07213864684987951}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.21666717529297, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.76666259765625, "Augmented-Accuracy": 99.1855, "Augmented-Loss": 0.0681888466334343, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.0527201088766257, "PGD-Accuracy": 2.4833333333333334, "PGD-Loss": 5.955089589436849}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 88, "Epoch-Time": 242.2227828502655, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.90999603271484, "Augmented-0.05-Quantile-Accuracy": 98.57999420166016, "Augmented-0.1-Quantile-Accuracy": 98.75999450683594, "Augmented-Accuracy": 99.2151, "Augmented-Loss": 0.06410301700937748, "Clean-Accuracy": 99.32, "Clean-Loss": 0.048645119774341584, "PGD-Accuracy": 2.12, "PGD-Loss": 6.113038461303711}, "Total-Time": 20648.867697000504, "Train": {"Loss": 0.9379352959173697, "avg t": 0.921984370690805, "plain loss": 0.09935938786400687, "standard loss": 0.07351738004993509}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.18333435058594, "Augmented-0.05-Quantile-Accuracy": 98.78333282470703, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.219, "Augmented-Loss": 0.061544850378731884, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.04790570232272148, "PGD-Accuracy": 2.7, "PGD-Loss": 6.021783983866373}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 89, "Epoch-Time": 242.2510986328125, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.93999481201172, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.1931, "Augmented-Loss": 0.07444621877980233, "Clean-Accuracy": 99.3, "Clean-Loss": 0.05680360552072525, "PGD-Accuracy": 1.82, "PGD-Loss": 6.024825344848633}, "Total-Time": 20891.118795633316, "Train": {"Loss": 0.9379605712890625, "avg t": 0.9219858758714464, "plain loss": 0.09859681248135041, "standard loss": 0.07304065829736216}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.1500015258789, "Augmented-0.05-Quantile-Accuracy": 98.56666564941406, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.169, "Augmented-Loss": 0.06980695129374663, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.0540452635884285, "PGD-Accuracy": 2.2333333333333334, "PGD-Loss": 5.985815653483073}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 90, "Epoch-Time": 242.24130487442017, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.93000030517578, "Augmented-0.05-Quantile-Accuracy": 98.45999908447266, "Augmented-0.1-Quantile-Accuracy": 98.72000122070312, "Augmented-Accuracy": 99.1864, "Augmented-Loss": 0.07553581300878524, "Clean-Accuracy": 99.24, "Clean-Loss": 0.057499589133262634, "PGD-Accuracy": 1.68, "PGD-Loss": 5.846785836791992}, "Total-Time": 21133.360100507736, "Train": {"Loss": 0.9380066289725127, "avg t": 0.9219888454013401, "plain loss": 0.10039916721979773, "standard loss": 0.07443256942210374}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.08333587646484, "Augmented-0.05-Quantile-Accuracy": 98.56666564941406, "Augmented-0.1-Quantile-Accuracy": 98.8499984741211, "Augmented-Accuracy": 99.19633333333333, "Augmented-Loss": 0.0711507289793094, "Clean-Accuracy": 99.25, "Clean-Loss": 0.05507338908314705, "PGD-Accuracy": 1.7833333333333334, "PGD-Loss": 5.7681484781901045}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 91, "Epoch-Time": 203.65563869476318, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.75999450683594, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.81999969482422, "Augmented-Accuracy": 99.2031, "Augmented-Loss": 0.07273791057753563, "Clean-Accuracy": 99.28, "Clean-Loss": 0.05489807875156403, "PGD-Accuracy": 1.6, "PGD-Loss": 6.06247177734375}, "Total-Time": 21337.0157392025, "Train": {"Loss": 0.9379125850465563, "avg t": 0.9219801838486283, "plain loss": 0.09903553850739091, "standard loss": 0.07343427360609725}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.21666717529297, "Augmented-0.05-Quantile-Accuracy": 98.69999694824219, "Augmented-0.1-Quantile-Accuracy": 98.94999694824219, "Augmented-Accuracy": 99.24083333333333, "Augmented-Loss": 0.06850423431177934, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.052421590795119606, "PGD-Accuracy": 1.7333333333333334, "PGD-Loss": 5.997426223754883}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 92, "Epoch-Time": 222.7741436958313, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.82999420166016, "Augmented-0.05-Quantile-Accuracy": 98.5199966430664, "Augmented-0.1-Quantile-Accuracy": 98.75999450683594, "Augmented-Accuracy": 99.1876, "Augmented-Loss": 0.07575753906154632, "Clean-Accuracy": 99.33, "Clean-Loss": 0.05587443469762802, "PGD-Accuracy": 2.55, "PGD-Loss": 5.906958953857422}, "Total-Time": 21559.78988289833, "Train": {"Loss": 0.9378782626964428, "avg t": 0.9219784778312401, "plain loss": 0.09389791601322317, "standard loss": 0.0673799313240581}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.18333435058594, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.22466666666666, "Augmented-Loss": 0.07123752532919247, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.05352596998214722, "PGD-Accuracy": 3.0, "PGD-Loss": 5.810998184204101}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 93, "Epoch-Time": 242.02741503715515, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.69999694824219, "Augmented-0.05-Quantile-Accuracy": 98.47999572753906, "Augmented-0.1-Quantile-Accuracy": 98.5999984741211, "Augmented-Accuracy": 99.1699, "Augmented-Loss": 0.07583012397861481, "Clean-Accuracy": 99.28, "Clean-Loss": 0.056936237108707426, "PGD-Accuracy": 2.39, "PGD-Loss": 5.637045361328125}, "Total-Time": 21801.817297935486, "Train": {"Loss": 0.9379766124795984, "avg t": 0.9219877370198568, "plain loss": 0.09809639721799776, "standard loss": 0.07143619610203637}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.04999542236328, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.8499984741211, "Augmented-Accuracy": 99.1985, "Augmented-Loss": 0.07062324190378189, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.05378766528765361, "PGD-Accuracy": 2.75, "PGD-Loss": 5.555377769470215}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 94, "Epoch-Time": 242.182697057724, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.81999969482422, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.1905, "Augmented-Loss": 0.07233477274560929, "Clean-Accuracy": 99.3, "Clean-Loss": 0.05311155973672867, "PGD-Accuracy": 2.61, "PGD-Loss": 5.789514990234375}, "Total-Time": 22043.99999499321, "Train": {"Loss": 0.9378870109628749, "avg t": 0.9219733462863499, "plain loss": 0.09824087675589097, "standard loss": 0.07074134882511916}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.13333129882812, "Augmented-0.05-Quantile-Accuracy": 98.61666870117188, "Augmented-0.1-Quantile-Accuracy": 98.8499984741211, "Augmented-Accuracy": 99.18533333333333, "Augmented-Loss": 0.06808062546074391, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.05099108821153641, "PGD-Accuracy": 2.716666666666667, "PGD-Loss": 5.690109296162923}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 95, "Epoch-Time": 241.97692155838013, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.88999938964844, "Augmented-0.05-Quantile-Accuracy": 98.47000122070312, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.1751, "Augmented-Loss": 0.06862607304537297, "Clean-Accuracy": 99.24, "Clean-Loss": 0.05203421380519867, "PGD-Accuracy": 1.77, "PGD-Loss": 5.78296760559082}, "Total-Time": 22285.97691655159, "Train": {"Loss": 0.9379182111422221, "avg t": 0.921980570545903, "plain loss": 0.0986991748474262, "standard loss": 0.07143143116765552}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.21666717529297, "Augmented-0.05-Quantile-Accuracy": 98.56666564941406, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.179, "Augmented-Loss": 0.06370408209095399, "Clean-Accuracy": 99.25, "Clean-Loss": 0.04922790539264679, "PGD-Accuracy": 2.3, "PGD-Loss": 5.719361717224121}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 96, "Epoch-Time": 218.76538610458374, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.90999603271484, "Augmented-0.05-Quantile-Accuracy": 98.55999755859375, "Augmented-0.1-Quantile-Accuracy": 98.73999786376953, "Augmented-Accuracy": 99.212, "Augmented-Loss": 0.07204492541718482, "Clean-Accuracy": 99.28, "Clean-Loss": 0.053421128034591675, "PGD-Accuracy": 2.07, "PGD-Loss": 5.595995037841797}, "Total-Time": 22504.742302656174, "Train": {"Loss": 0.9378801935690421, "avg t": 0.9219789118590178, "plain loss": 0.09584599124767157, "standard loss": 0.06958592792131282}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.13333129882812, "Augmented-0.05-Quantile-Accuracy": 98.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.1995, "Augmented-Loss": 0.06824823436538378, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.05180046144127846, "PGD-Accuracy": 2.1333333333333333, "PGD-Loss": 5.5028392105102535}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 97, "Epoch-Time": 210.52921748161316, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.90999603271484, "Augmented-0.05-Quantile-Accuracy": 98.43000030517578, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.1598, "Augmented-Loss": 0.06351372176241875, "Clean-Accuracy": 99.29, "Clean-Loss": 0.04827584211230278, "PGD-Accuracy": 2.15, "PGD-Loss": 5.840889642333984}, "Total-Time": 22715.271520137787, "Train": {"Loss": 0.9378841733755888, "avg t": 0.9219823148515489, "plain loss": 0.09665471002084251, "standard loss": 0.06949654875861273}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.18333435058594, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.83333587646484, "Augmented-Accuracy": 99.18766666666667, "Augmented-Loss": 0.05970292056451241, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.04621514907479286, "PGD-Accuracy": 2.4, "PGD-Loss": 5.740960670471192}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 98, "Epoch-Time": 241.33675527572632, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.79000091552734, "Augmented-0.05-Quantile-Accuracy": 98.40999603271484, "Augmented-0.1-Quantile-Accuracy": 98.66999816894531, "Augmented-Accuracy": 99.1765, "Augmented-Loss": 0.0731205921201706, "Clean-Accuracy": 99.31, "Clean-Loss": 0.05500038590431213, "PGD-Accuracy": 2.1, "PGD-Loss": 5.645003945922851}, "Total-Time": 22956.608275413513, "Train": {"Loss": 0.9379900896637529, "avg t": 0.9219882201088799, "plain loss": 0.09718039261500046, "standard loss": 0.07053106088991519}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.96666717529297, "Augmented-0.05-Quantile-Accuracy": 98.54999542236328, "Augmented-0.1-Quantile-Accuracy": 98.8499984741211, "Augmented-Accuracy": 99.189, "Augmented-Loss": 0.06830494114538034, "Clean-Accuracy": 99.3, "Clean-Loss": 0.0522404624124368, "PGD-Accuracy": 2.783333333333333, "PGD-Loss": 5.596091550191243}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 99, "Epoch-Time": 242.06276535987854, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.8699951171875, "Augmented-0.05-Quantile-Accuracy": 98.47999572753906, "Augmented-0.1-Quantile-Accuracy": 98.70999908447266, "Augmented-Accuracy": 99.1932, "Augmented-Loss": 0.07939944347572327, "Clean-Accuracy": 99.24, "Clean-Loss": 0.0599570381641388, "PGD-Accuracy": 2.11, "PGD-Loss": 5.593355569458008}, "Total-Time": 23198.67104077339, "Train": {"Loss": 0.9379335378894099, "avg t": 0.9219842939730044, "plain loss": 0.10092593769850547, "standard loss": 0.0732356372586003}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.96666717529297, "Augmented-0.05-Quantile-Accuracy": 98.53333282470703, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.14283333333333, "Augmented-Loss": 0.07493120176970959, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.05748121750354767, "PGD-Accuracy": 2.1, "PGD-Loss": 5.52562016805013}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 100, "Epoch-Time": 241.88917541503906, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.00999450683594, "Augmented-0.05-Quantile-Accuracy": 98.52999877929688, "Augmented-0.1-Quantile-Accuracy": 98.73999786376953, "Augmented-Accuracy": 99.2146, "Augmented-Loss": 0.06861944706213474, "Clean-Accuracy": 99.33, "Clean-Loss": 0.05094227486848831, "PGD-Accuracy": 2.02, "PGD-Loss": 6.001541940307617}, "Total-Time": 23440.56021618843, "Train": {"Loss": 0.9379047269114742, "avg t": 0.9219711385656286, "plain loss": 0.09525319894861298, "standard loss": 0.06832135890700199}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.18333435058594, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.197, "Augmented-Loss": 0.06489727763493856, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.04932697579264641, "PGD-Accuracy": 2.1666666666666665, "PGD-Loss": 5.950920542399088}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 101, "Epoch-Time": 241.4707236289978, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.75999450683594, "Augmented-0.05-Quantile-Accuracy": 98.38999938964844, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.1596, "Augmented-Loss": 0.07560324765872956, "Clean-Accuracy": 99.32, "Clean-Loss": 0.055226956868171695, "PGD-Accuracy": 2.67, "PGD-Loss": 5.687485757446289}, "Total-Time": 23682.03093981743, "Train": {"Loss": 0.9378986997957582, "avg t": 0.9219793832567003, "plain loss": 0.09343103186995892, "standard loss": 0.06640907774148164}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.1500015258789, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.1755, "Augmented-Loss": 0.07131751815577347, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.05301550968488057, "PGD-Accuracy": 2.8333333333333335, "PGD-Loss": 5.577032170613607}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 102, "Epoch-Time": 203.72802424430847, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.83999633789062, "Augmented-0.05-Quantile-Accuracy": 98.43999481201172, "Augmented-0.1-Quantile-Accuracy": 98.72000122070312, "Augmented-Accuracy": 99.1701, "Augmented-Loss": 0.07829546143746376, "Clean-Accuracy": 99.28, "Clean-Loss": 0.056709127390384674, "PGD-Accuracy": 1.78, "PGD-Loss": 5.531838244628906}, "Total-Time": 23885.758964061737, "Train": {"Loss": 0.9378443131093626, "avg t": 0.9219732996975935, "plain loss": 0.0932465335157182, "standard loss": 0.06522761602644567}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.08333587646484, "Augmented-0.05-Quantile-Accuracy": 98.68333435058594, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.1905, "Augmented-Loss": 0.07349123927791913, "Clean-Accuracy": 99.25, "Clean-Loss": 0.05414769401152929, "PGD-Accuracy": 2.65, "PGD-Loss": 5.510109555562337}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 103, "Epoch-Time": 225.4325168132782, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.66999816894531, "Augmented-0.05-Quantile-Accuracy": 98.36000061035156, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.1479, "Augmented-Loss": 0.08463412964081764, "Clean-Accuracy": 99.27, "Clean-Loss": 0.06006185299158096, "PGD-Accuracy": 2.66, "PGD-Loss": 5.279053323364258}, "Total-Time": 24111.191480875015, "Train": {"Loss": 0.9379487489417747, "avg t": 0.9219866175828156, "plain loss": 0.09858232972180402, "standard loss": 0.0689046380939307}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 97.93333435058594, "Augmented-0.05-Quantile-Accuracy": 98.5, "Augmented-0.1-Quantile-Accuracy": 98.66666412353516, "Augmented-Accuracy": 99.094, "Augmented-Loss": 0.0797733437349399, "Clean-Accuracy": 99.18333333333334, "Clean-Loss": 0.05771111377080282, "PGD-Accuracy": 2.8666666666666667, "PGD-Loss": 5.247153177897135}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 104, "Epoch-Time": 242.0965874195099, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.75999450683594, "Augmented-0.05-Quantile-Accuracy": 98.52999877929688, "Augmented-0.1-Quantile-Accuracy": 98.62999725341797, "Augmented-Accuracy": 99.1248, "Augmented-Loss": 0.07485228334474564, "Clean-Accuracy": 99.23, "Clean-Loss": 0.054257508182525636, "PGD-Accuracy": 2.42, "PGD-Loss": 5.506256582641601}, "Total-Time": 24353.288068294525, "Train": {"Loss": 0.9378906206201624, "avg t": 0.9219773983602171, "plain loss": 0.0976238517125447, "standard loss": 0.06764124253723357}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0999984741211, "Augmented-0.05-Quantile-Accuracy": 98.61666870117188, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.2375, "Augmented-Loss": 0.06935135408202807, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.05100658162434896, "PGD-Accuracy": 2.7666666666666666, "PGD-Loss": 5.396920557657878}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 105, "Epoch-Time": 242.01138758659363, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.90999603271484, "Augmented-0.05-Quantile-Accuracy": 98.44999694824219, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.186, "Augmented-Loss": 0.07145218250751495, "Clean-Accuracy": 99.32, "Clean-Loss": 0.05026176733970642, "PGD-Accuracy": 1.71, "PGD-Loss": 5.812768634033203}, "Total-Time": 24595.29945588112, "Train": {"Loss": 0.9379944476728086, "avg t": 0.9219832711396394, "plain loss": 0.09615516630278706, "standard loss": 0.0665588396191597}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.13333129882812, "Augmented-0.05-Quantile-Accuracy": 98.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.73332977294922, "Augmented-Accuracy": 99.19383333333333, "Augmented-Loss": 0.06760389078617096, "Clean-Accuracy": 99.3, "Clean-Loss": 0.04892311715086301, "PGD-Accuracy": 1.9166666666666667, "PGD-Loss": 5.699767913818359}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 106, "Epoch-Time": 242.4038269519806, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.02999877929688, "Augmented-0.05-Quantile-Accuracy": 98.56999969482422, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.2262, "Augmented-Loss": 0.06319399719309807, "Clean-Accuracy": 99.32, "Clean-Loss": 0.0452359073638916, "PGD-Accuracy": 1.42, "PGD-Loss": 5.851115747070312}, "Total-Time": 24837.7032828331, "Train": {"Loss": 0.9378917442957561, "avg t": 0.9219803389090079, "plain loss": 0.093661357528192, "standard loss": 0.06404738066814564}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.21666717529297, "Augmented-0.05-Quantile-Accuracy": 98.79999542236328, "Augmented-0.1-Quantile-Accuracy": 99.0, "Augmented-Accuracy": 99.261, "Augmented-Loss": 0.05951503216574589, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.04394296775261561, "PGD-Accuracy": 1.7666666666666666, "PGD-Loss": 5.76646359761556}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 107, "Epoch-Time": 213.74331212043762, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.89999389648438, "Augmented-0.05-Quantile-Accuracy": 98.48999786376953, "Augmented-0.1-Quantile-Accuracy": 98.72999572753906, "Augmented-Accuracy": 99.1699, "Augmented-Loss": 0.06755809924793243, "Clean-Accuracy": 99.28, "Clean-Loss": 0.048853346478939054, "PGD-Accuracy": 1.75, "PGD-Loss": 5.7013791473388675}, "Total-Time": 25051.446594953537, "Train": {"Loss": 0.9379242456400836, "avg t": 0.9219735784883852, "plain loss": 0.09120029792785642, "standard loss": 0.06411278043852912}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.21666717529297, "Augmented-0.05-Quantile-Accuracy": 98.68333435058594, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.20016666666666, "Augmented-Loss": 0.06282522447655599, "Clean-Accuracy": 99.3, "Clean-Loss": 0.046470385114351906, "PGD-Accuracy": 1.8166666666666667, "PGD-Loss": 5.6468944829305014}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 108, "Epoch-Time": 214.171630859375, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.93000030517578, "Augmented-0.05-Quantile-Accuracy": 98.47999572753906, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.1718, "Augmented-Loss": 0.07230595231556892, "Clean-Accuracy": 99.27, "Clean-Loss": 0.05362547738552093, "PGD-Accuracy": 1.43, "PGD-Loss": 5.916007867431641}, "Total-Time": 25265.618225812912, "Train": {"Loss": 0.9378836847234655, "avg t": 0.9219681183850323, "plain loss": 0.09708736180022923, "standard loss": 0.06867994413221323}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.11666870117188, "Augmented-0.05-Quantile-Accuracy": 98.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.21716666666667, "Augmented-Loss": 0.06785210485974948, "Clean-Accuracy": 99.36666666666666, "Clean-Loss": 0.051100895375013354, "PGD-Accuracy": 1.9166666666666667, "PGD-Loss": 5.8431031697591145}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 109, "Epoch-Time": 242.21027779579163, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.8499984741211, "Augmented-0.05-Quantile-Accuracy": 98.45999908447266, "Augmented-0.1-Quantile-Accuracy": 98.70999908447266, "Augmented-Accuracy": 99.189, "Augmented-Loss": 0.06843577301681042, "Clean-Accuracy": 99.29, "Clean-Loss": 0.050474925696849825, "PGD-Accuracy": 1.5, "PGD-Loss": 6.037852587890625}, "Total-Time": 25507.828503608704, "Train": {"Loss": 0.937855525193391, "avg t": 0.9219726801448398, "plain loss": 0.09582801373976249, "standard loss": 0.06848456900428843}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.29999542236328, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.73332977294922, "Augmented-Accuracy": 99.20666666666666, "Augmented-Loss": 0.06436123334358136, "Clean-Accuracy": 99.25, "Clean-Loss": 0.04830331891775131, "PGD-Accuracy": 1.65, "PGD-Loss": 6.03328103129069}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 110, "Epoch-Time": 241.93882822990417, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.79999542236328, "Augmented-0.05-Quantile-Accuracy": 98.44999694824219, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.1923, "Augmented-Loss": 0.07238988546848298, "Clean-Accuracy": 99.27, "Clean-Loss": 0.053406607151031495, "PGD-Accuracy": 1.55, "PGD-Loss": 6.1528349761962895}, "Total-Time": 25749.767331838608, "Train": {"Loss": 0.9379096758807147, "avg t": 0.9219781787307174, "plain loss": 0.09539503680511748, "standard loss": 0.06778169812317247}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.25, "Augmented-0.05-Quantile-Accuracy": 98.69999694824219, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.14783333333334, "Augmented-Loss": 0.06892457544724147, "Clean-Accuracy": 99.2, "Clean-Loss": 0.05176942381262779, "PGD-Accuracy": 1.8666666666666667, "PGD-Loss": 6.047295084635417}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 111, "Epoch-Time": 241.89584922790527, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.98999786376953, "Augmented-0.05-Quantile-Accuracy": 98.48999786376953, "Augmented-0.1-Quantile-Accuracy": 98.79000091552734, "Augmented-Accuracy": 99.1724, "Augmented-Loss": 0.07219221803069115, "Clean-Accuracy": 99.28, "Clean-Loss": 0.05303959152698517, "PGD-Accuracy": 1.28, "PGD-Loss": 5.788435479736328}, "Total-Time": 25991.663181066513, "Train": {"Loss": 0.9378565307193332, "avg t": 0.9219735096825493, "plain loss": 0.09394377086074267, "standard loss": 0.06571867909806746}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.25, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.83333587646484, "Augmented-Accuracy": 99.20866666666667, "Augmented-Loss": 0.06799846882681052, "Clean-Accuracy": 99.21666666666667, "Clean-Loss": 0.05097856558362643, "PGD-Accuracy": 1.3333333333333333, "PGD-Loss": 5.677254686991374}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 112, "Epoch-Time": 239.2989490032196, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.97000122070312, "Augmented-0.05-Quantile-Accuracy": 98.52999877929688, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.2516, "Augmented-Loss": 0.0775869036052227, "Clean-Accuracy": 99.37, "Clean-Loss": 0.05539840281009674, "PGD-Accuracy": 1.08, "PGD-Loss": 5.948688330078125}, "Total-Time": 26230.962130069733, "Train": {"Loss": 0.9378996618058947, "avg t": 0.9219748426366735, "plain loss": 0.09502721924605192, "standard loss": 0.06695329168990806}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.26666259765625, "Augmented-0.05-Quantile-Accuracy": 98.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.86666870117188, "Augmented-Accuracy": 99.249, "Augmented-Loss": 0.07289833342750868, "Clean-Accuracy": 99.35, "Clean-Loss": 0.05324223526318868, "PGD-Accuracy": 1.3, "PGD-Loss": 5.824343821207682}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 113, "Epoch-Time": 202.47718739509583, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.81999969482422, "Augmented-0.05-Quantile-Accuracy": 98.50999450683594, "Augmented-0.1-Quantile-Accuracy": 98.77999877929688, "Augmented-Accuracy": 99.2236, "Augmented-Loss": 0.07344412014722825, "Clean-Accuracy": 99.34, "Clean-Loss": 0.053094366812706, "PGD-Accuracy": 1.48, "PGD-Loss": 5.914644445800781}, "Total-Time": 26433.43931746483, "Train": {"Loss": 0.9378550139533149, "avg t": 0.9219660937697799, "plain loss": 0.09432692805042972, "standard loss": 0.06560992074895788}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.23332977294922, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.76666259765625, "Augmented-Accuracy": 99.15566666666666, "Augmented-Loss": 0.06994102647682031, "Clean-Accuracy": 99.25, "Clean-Loss": 0.05170948550105095, "PGD-Accuracy": 2.05, "PGD-Loss": 5.821913650512696}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 114, "Epoch-Time": 227.85375308990479, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.91999816894531, "Augmented-0.05-Quantile-Accuracy": 98.52999877929688, "Augmented-0.1-Quantile-Accuracy": 98.75999450683594, "Augmented-Accuracy": 99.1848, "Augmented-Loss": 0.06782142963564396, "Clean-Accuracy": 99.26, "Clean-Loss": 0.049729135870933534, "PGD-Accuracy": 1.76, "PGD-Loss": 5.949825302124023}, "Total-Time": 26661.293070554733, "Train": {"Loss": 0.9379087236192492, "avg t": 0.9219731743600633, "plain loss": 0.09605311056243039, "standard loss": 0.06611892382966147}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.21666717529297, "Augmented-0.05-Quantile-Accuracy": 98.6500015258789, "Augmented-0.1-Quantile-Accuracy": 98.76666259765625, "Augmented-Accuracy": 99.17016666666666, "Augmented-Loss": 0.06456291064163049, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.04849312054117521, "PGD-Accuracy": 2.15, "PGD-Loss": 5.857946873982748}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 115, "Epoch-Time": 242.12037301063538, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.97000122070312, "Augmented-0.05-Quantile-Accuracy": 98.52999877929688, "Augmented-0.1-Quantile-Accuracy": 98.79000091552734, "Augmented-Accuracy": 99.1986, "Augmented-Loss": 0.07553570152163505, "Clean-Accuracy": 99.29, "Clean-Loss": 0.054379318249225615, "PGD-Accuracy": 1.44, "PGD-Loss": 5.7429356842041015}, "Total-Time": 26903.41344356537, "Train": {"Loss": 0.9378905916743808, "avg t": 0.9219702896542019, "plain loss": 0.09682079021312574, "standard loss": 0.06796542559508924}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.18333435058594, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.23833333333333, "Augmented-Loss": 0.07132574640731017, "Clean-Accuracy": 99.33333333333333, "Clean-Loss": 0.05237563562393188, "PGD-Accuracy": 1.6333333333333333, "PGD-Loss": 5.665787719726563}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 116, "Epoch-Time": 242.17878890037537, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.95999908447266, "Augmented-0.05-Quantile-Accuracy": 98.52999877929688, "Augmented-0.1-Quantile-Accuracy": 98.77999877929688, "Augmented-Accuracy": 99.1873, "Augmented-Loss": 0.07077615864396096, "Clean-Accuracy": 99.28, "Clean-Loss": 0.05125827913284302, "PGD-Accuracy": 1.61, "PGD-Loss": 5.929812872314453}, "Total-Time": 27145.592232465744, "Train": {"Loss": 0.9379023274315728, "avg t": 0.9219735273431848, "plain loss": 0.09745686779022207, "standard loss": 0.0681940715710322}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.31666564941406, "Augmented-0.05-Quantile-Accuracy": 98.69999694824219, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.24116666666667, "Augmented-Loss": 0.06681912758767605, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.049422522763411206, "PGD-Accuracy": 1.6833333333333333, "PGD-Loss": 5.836021886189779}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 117, "Epoch-Time": 242.20581817626953, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.73999786376953, "Augmented-0.05-Quantile-Accuracy": 98.3499984741211, "Augmented-0.1-Quantile-Accuracy": 98.58999633789062, "Augmented-Accuracy": 99.1301, "Augmented-Loss": 0.06819404332172871, "Clean-Accuracy": 99.23, "Clean-Loss": 0.05098633041381836, "PGD-Accuracy": 1.75, "PGD-Loss": 5.940486428833008}, "Total-Time": 27387.798050642014, "Train": {"Loss": 0.9378947229738589, "avg t": 0.9219806673438461, "plain loss": 0.09269700302901088, "standard loss": 0.06409457263460866}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.06666564941406, "Augmented-0.05-Quantile-Accuracy": 98.54999542236328, "Augmented-0.1-Quantile-Accuracy": 98.9000015258789, "Augmented-Accuracy": 99.21566666666666, "Augmented-Loss": 0.06315209056138993, "Clean-Accuracy": 99.35, "Clean-Loss": 0.04790218754609426, "PGD-Accuracy": 2.433333333333333, "PGD-Loss": 5.804356618245443}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 118, "Epoch-Time": 209.5255880355835, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.79000091552734, "Augmented-0.05-Quantile-Accuracy": 98.48999786376953, "Augmented-0.1-Quantile-Accuracy": 98.75999450683594, "Augmented-Accuracy": 99.221, "Augmented-Loss": 0.0751193270418644, "Clean-Accuracy": 99.31, "Clean-Loss": 0.05459287155866623, "PGD-Accuracy": 1.43, "PGD-Loss": 5.798108432006836}, "Total-Time": 27597.323638677597, "Train": {"Loss": 0.9378669686140837, "avg t": 0.9219691215091281, "plain loss": 0.09533657701986817, "standard loss": 0.0667532236929293}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.11666870117188, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.20866666666667, "Augmented-Loss": 0.0701419798151652, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.05181351351737976, "PGD-Accuracy": 1.5, "PGD-Loss": 5.7370833384195965}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 119, "Epoch-Time": 217.1172001361847, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.0199966430664, "Augmented-0.05-Quantile-Accuracy": 98.55999755859375, "Augmented-0.1-Quantile-Accuracy": 98.75999450683594, "Augmented-Accuracy": 99.2291, "Augmented-Loss": 0.0651855165708065, "Clean-Accuracy": 99.32, "Clean-Loss": 0.04709944285750389, "PGD-Accuracy": 1.03, "PGD-Loss": 6.217799966430664}, "Total-Time": 27814.44083881378, "Train": {"Loss": 0.9378408217959934, "avg t": 0.9219626207704897, "plain loss": 0.09545448783591927, "standard loss": 0.06717473553728175}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.31666564941406, "Augmented-0.05-Quantile-Accuracy": 98.73332977294922, "Augmented-0.1-Quantile-Accuracy": 98.9000015258789, "Augmented-Accuracy": 99.221, "Augmented-Loss": 0.062376863454679646, "Clean-Accuracy": 99.25, "Clean-Loss": 0.04643553886810939, "PGD-Accuracy": 1.2333333333333334, "PGD-Loss": 6.043687825520833}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 120, "Epoch-Time": 242.0649847984314, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.87999725341797, "Augmented-0.05-Quantile-Accuracy": 98.54000091552734, "Augmented-0.1-Quantile-Accuracy": 98.77999877929688, "Augmented-Accuracy": 99.2131, "Augmented-Loss": 0.06929192118346691, "Clean-Accuracy": 99.29, "Clean-Loss": 0.04919762353897095, "PGD-Accuracy": 1.56, "PGD-Loss": 5.957987115478516}, "Total-Time": 28056.505823612213, "Train": {"Loss": 0.9378264488997283, "avg t": 0.9219567469490899, "plain loss": 0.08888317030800712, "standard loss": 0.06108786020234779}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.03333282470703, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.18216666666666, "Augmented-Loss": 0.06708998764952023, "Clean-Accuracy": 99.3, "Clean-Loss": 0.04946048507094383, "PGD-Accuracy": 1.7166666666666666, "PGD-Loss": 5.9251646779378255}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 121, "Epoch-Time": 242.07599902153015, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.89999389648438, "Augmented-0.05-Quantile-Accuracy": 98.52999877929688, "Augmented-0.1-Quantile-Accuracy": 98.79000091552734, "Augmented-Accuracy": 99.2097, "Augmented-Loss": 0.06038856270766258, "Clean-Accuracy": 99.29, "Clean-Loss": 0.04267131121754646, "PGD-Accuracy": 1.64, "PGD-Loss": 6.066829592895508}, "Total-Time": 28298.581822633743, "Train": {"Loss": 0.937884382919029, "avg t": 0.9219643576586688, "plain loss": 0.09033096915527636, "standard loss": 0.06144809849836208}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.11666870117188, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.1955, "Augmented-Loss": 0.05773875444660584, "Clean-Accuracy": 99.3, "Clean-Loss": 0.0423662750373284, "PGD-Accuracy": 1.7833333333333334, "PGD-Loss": 5.972785827636719}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 122, "Epoch-Time": 242.18857622146606, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.04999542236328, "Augmented-0.05-Quantile-Accuracy": 98.61000061035156, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.2143, "Augmented-Loss": 0.06607449919867515, "Clean-Accuracy": 99.3, "Clean-Loss": 0.046654665857553484, "PGD-Accuracy": 1.31, "PGD-Loss": 5.996904434204102}, "Total-Time": 28540.77039885521, "Train": {"Loss": 0.9378889775629397, "avg t": 0.9219636723553692, "plain loss": 0.0890904881159465, "standard loss": 0.06085120374405826}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.29999542236328, "Augmented-0.05-Quantile-Accuracy": 98.76666259765625, "Augmented-0.1-Quantile-Accuracy": 98.88333129882812, "Augmented-Accuracy": 99.22883333333333, "Augmented-Loss": 0.06354905894656976, "Clean-Accuracy": 99.3, "Clean-Loss": 0.0463667537967364, "PGD-Accuracy": 1.5333333333333334, "PGD-Loss": 5.907456522623698}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 123, "Epoch-Time": 239.3799066543579, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.5999984741211, "Augmented-0.05-Quantile-Accuracy": 98.33999633789062, "Augmented-0.1-Quantile-Accuracy": 98.6199951171875, "Augmented-Accuracy": 99.1784, "Augmented-Loss": 0.07970781396555901, "Clean-Accuracy": 99.27, "Clean-Loss": 0.05695220067501068, "PGD-Accuracy": 1.63, "PGD-Loss": 5.726959646606446}, "Total-Time": 28780.150305509567, "Train": {"Loss": 0.937864057470251, "avg t": 0.9219653319782681, "plain loss": 0.0942630662988733, "standard loss": 0.06435351420111127}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.08333587646484, "Augmented-0.05-Quantile-Accuracy": 98.53333282470703, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.20333333333333, "Augmented-Loss": 0.07354937885383765, "Clean-Accuracy": 99.26666666666667, "Clean-Loss": 0.053702125132083896, "PGD-Accuracy": 2.066666666666667, "PGD-Loss": 5.672346405029296}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 124, "Epoch-Time": 200.19180965423584, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.00999450683594, "Augmented-0.05-Quantile-Accuracy": 98.65999603271484, "Augmented-0.1-Quantile-Accuracy": 98.83999633789062, "Augmented-Accuracy": 99.2147, "Augmented-Loss": 0.0704296865978241, "Clean-Accuracy": 99.25, "Clean-Loss": 0.050605759501457216, "PGD-Accuracy": 1.58, "PGD-Loss": 5.857890869140625}, "Total-Time": 28980.342115163803, "Train": {"Loss": 0.9378718395586367, "avg t": 0.9219723437980369, "plain loss": 0.09340793376498757, "standard loss": 0.06436696952802164}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.16666412353516, "Augmented-0.05-Quantile-Accuracy": 98.68333435058594, "Augmented-0.1-Quantile-Accuracy": 98.94999694824219, "Augmented-Accuracy": 99.22416666666666, "Augmented-Loss": 0.06691275417208671, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.04918186789751053, "PGD-Accuracy": 1.85, "PGD-Loss": 5.8309795201619465}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 125, "Epoch-Time": 230.27503204345703, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.0199966430664, "Augmented-0.05-Quantile-Accuracy": 98.6199951171875, "Augmented-0.1-Quantile-Accuracy": 98.80999755859375, "Augmented-Accuracy": 99.2625, "Augmented-Loss": 0.07156443254542351, "Clean-Accuracy": 99.36, "Clean-Loss": 0.04997923936843872, "PGD-Accuracy": 1.6, "PGD-Loss": 5.834586190795898}, "Total-Time": 29210.61714720726, "Train": {"Loss": 0.9378768079015943, "avg t": 0.9219639542191117, "plain loss": 0.08991146943834097, "standard loss": 0.06062667071157032}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.18333435058594, "Augmented-0.05-Quantile-Accuracy": 98.69999694824219, "Augmented-0.1-Quantile-Accuracy": 98.8499984741211, "Augmented-Accuracy": 99.20083333333334, "Augmented-Loss": 0.06842543746848902, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.049247242013613385, "PGD-Accuracy": 1.85, "PGD-Loss": 5.788813446044922}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 126, "Epoch-Time": 242.05301809310913, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.00999450683594, "Augmented-0.05-Quantile-Accuracy": 98.5199966430664, "Augmented-0.1-Quantile-Accuracy": 98.79000091552734, "Augmented-Accuracy": 99.2346, "Augmented-Loss": 0.062254700478196145, "Clean-Accuracy": 99.35, "Clean-Loss": 0.04501502335071564, "PGD-Accuracy": 1.15, "PGD-Loss": 6.276568542480469}, "Total-Time": 29452.67016530037, "Train": {"Loss": 0.9378496532793398, "avg t": 0.9219609038035075, "plain loss": 0.09219723210158175, "standard loss": 0.06389143775569069}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.23332977294922, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.8499984741211, "Augmented-Accuracy": 99.20233333333333, "Augmented-Loss": 0.06058113495737314, "Clean-Accuracy": 99.25, "Clean-Loss": 0.04544619299471378, "PGD-Accuracy": 1.3666666666666667, "PGD-Loss": 6.193214833577474}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 127, "Epoch-Time": 241.88700580596924, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.72999572753906, "Augmented-0.05-Quantile-Accuracy": 98.41999816894531, "Augmented-0.1-Quantile-Accuracy": 98.68000030517578, "Augmented-Accuracy": 99.1558, "Augmented-Loss": 0.08107609193277358, "Clean-Accuracy": 99.19, "Clean-Loss": 0.058517727553844455, "PGD-Accuracy": 2.45, "PGD-Loss": 5.5654655487060545}, "Total-Time": 29694.55717110634, "Train": {"Loss": 0.9379120994144016, "avg t": 0.9219685445361667, "plain loss": 0.09391928238338883, "standard loss": 0.06414341510887499}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0999984741211, "Augmented-0.05-Quantile-Accuracy": 98.58333587646484, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.17933333333333, "Augmented-Loss": 0.07623832069575787, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.055778883934020994, "PGD-Accuracy": 2.8, "PGD-Loss": 5.5199976043701175}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 128, "Epoch-Time": 242.06146931648254, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.02999877929688, "Augmented-0.05-Quantile-Accuracy": 98.56999969482422, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.1944, "Augmented-Loss": 0.06536604249751568, "Clean-Accuracy": 99.24, "Clean-Loss": 0.04768476415872574, "PGD-Accuracy": 1.49, "PGD-Loss": 5.807564007568359}, "Total-Time": 29936.61864042282, "Train": {"Loss": 0.9378656942226269, "avg t": 0.9219631031884088, "plain loss": 0.09380146871319528, "standard loss": 0.06585575722323524}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.19999694824219, "Augmented-0.05-Quantile-Accuracy": 98.66666412353516, "Augmented-0.1-Quantile-Accuracy": 98.86666870117188, "Augmented-Accuracy": 99.21533333333333, "Augmented-Loss": 0.06229109713176886, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.04672223512331645, "PGD-Accuracy": 1.95, "PGD-Loss": 5.668912562052409}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 129, "Epoch-Time": 206.1608612537384, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.95999908447266, "Augmented-0.05-Quantile-Accuracy": 98.55999755859375, "Augmented-0.1-Quantile-Accuracy": 98.80999755859375, "Augmented-Accuracy": 99.2231, "Augmented-Loss": 0.06820246048176289, "Clean-Accuracy": 99.35, "Clean-Loss": 0.048603423023223874, "PGD-Accuracy": 1.29, "PGD-Loss": 5.8682924774169924}, "Total-Time": 30142.77950167656, "Train": {"Loss": 0.9378397928167272, "avg t": 0.9219614743833189, "plain loss": 0.09073793293281827, "standard loss": 0.06266808642502185}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.31666564941406, "Augmented-0.05-Quantile-Accuracy": 98.68333435058594, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.22416666666666, "Augmented-Loss": 0.06470117922862371, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.04726661478479703, "PGD-Accuracy": 1.6, "PGD-Loss": 5.809160985310872}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 130, "Epoch-Time": 194.14664673805237, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.97999572753906, "Augmented-0.05-Quantile-Accuracy": 98.56999969482422, "Augmented-0.1-Quantile-Accuracy": 98.8499984741211, "Augmented-Accuracy": 99.2155, "Augmented-Loss": 0.06411603985238075, "Clean-Accuracy": 99.28, "Clean-Loss": 0.045461418950557705, "PGD-Accuracy": 1.43, "PGD-Loss": 5.881500869750977}, "Total-Time": 30336.92614841461, "Train": {"Loss": 0.9378758211135865, "avg t": 0.9219615114706534, "plain loss": 0.09175397431232317, "standard loss": 0.06187392494303209}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.18333435058594, "Augmented-0.05-Quantile-Accuracy": 98.53333282470703, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.18166666666667, "Augmented-Loss": 0.06155442549486955, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.04506314184268315, "PGD-Accuracy": 1.6833333333333333, "PGD-Loss": 5.792916865030924}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 131, "Epoch-Time": 104.31332612037659, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.04999542236328, "Augmented-0.05-Quantile-Accuracy": 98.56999969482422, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.2349, "Augmented-Loss": 0.06435688663363456, "Clean-Accuracy": 99.34, "Clean-Loss": 0.04605042607784271, "PGD-Accuracy": 1.39, "PGD-Loss": 5.784059512329102}, "Total-Time": 30441.23947453499, "Train": {"Loss": 0.9378650914651376, "avg t": 0.9219617544809977, "plain loss": 0.093322262011634, "standard loss": 0.06426797069885112}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.23332977294922, "Augmented-0.05-Quantile-Accuracy": 98.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.22566666666667, "Augmented-Loss": 0.06104428517301878, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.045039609909057615, "PGD-Accuracy": 1.7, "PGD-Loss": 5.757162923177083}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 132, "Epoch-Time": 104.29311442375183, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.04999542236328, "Augmented-0.05-Quantile-Accuracy": 98.54000091552734, "Augmented-0.1-Quantile-Accuracy": 98.77999877929688, "Augmented-Accuracy": 99.2357, "Augmented-Loss": 0.06687776774013042, "Clean-Accuracy": 99.35, "Clean-Loss": 0.04765790470838547, "PGD-Accuracy": 1.7, "PGD-Loss": 5.836320288085937}, "Total-Time": 30545.53258895874, "Train": {"Loss": 0.9378464660114713, "avg t": 0.9219607306586372, "plain loss": 0.093965550576316, "standard loss": 0.06523986474562574}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.23332977294922, "Augmented-0.05-Quantile-Accuracy": 98.71666717529297, "Augmented-0.1-Quantile-Accuracy": 98.86666870117188, "Augmented-Accuracy": 99.23666666666666, "Augmented-Loss": 0.0634396598537763, "Clean-Accuracy": 99.3, "Clean-Loss": 0.04642621713876724, "PGD-Accuracy": 1.8833333333333333, "PGD-Loss": 5.710666061401367}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 133, "Epoch-Time": 105.23147511482239, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.79000091552734, "Augmented-0.05-Quantile-Accuracy": 98.47999572753906, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.2014, "Augmented-Loss": 0.06657210289096832, "Clean-Accuracy": 99.3, "Clean-Loss": 0.04882298420071602, "PGD-Accuracy": 2.23, "PGD-Loss": 5.827911672973633}, "Total-Time": 30650.764064073563, "Train": {"Loss": 0.9378240003232603, "avg t": 0.9219614840790078, "plain loss": 0.0912870936411399, "standard loss": 0.06385072309882553}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.28333282470703, "Augmented-0.05-Quantile-Accuracy": 98.78333282470703, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.2625, "Augmented-Loss": 0.06302895051956177, "Clean-Accuracy": 99.33333333333333, "Clean-Loss": 0.04713410409291585, "PGD-Accuracy": 2.75, "PGD-Loss": 5.797201807657878}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 134, "Epoch-Time": 104.95263481140137, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.89999389648438, "Augmented-0.05-Quantile-Accuracy": 98.48999786376953, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.1956, "Augmented-Loss": 0.07168277431511878, "Clean-Accuracy": 99.31, "Clean-Loss": 0.05157366666793823, "PGD-Accuracy": 1.62, "PGD-Loss": 5.796347241210937}, "Total-Time": 30755.716698884964, "Train": {"Loss": 0.9378161662066424, "avg t": 0.9219524738876907, "plain loss": 0.0889647189811425, "standard loss": 0.06202430868811078}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.1500015258789, "Augmented-0.05-Quantile-Accuracy": 98.63333129882812, "Augmented-0.1-Quantile-Accuracy": 98.81666564941406, "Augmented-Accuracy": 99.196, "Augmented-Loss": 0.0687036666148901, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.05078447971741359, "PGD-Accuracy": 2.033333333333333, "PGD-Loss": 5.727170819600423}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 135, "Epoch-Time": 105.18056559562683, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.95999908447266, "Augmented-0.05-Quantile-Accuracy": 98.47000122070312, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.1552, "Augmented-Loss": 0.06824864134168625, "Clean-Accuracy": 99.21, "Clean-Loss": 0.05031427081823349, "PGD-Accuracy": 1.13, "PGD-Loss": 6.1085353790283206}, "Total-Time": 30860.89726448059, "Train": {"Loss": 0.9378058902599193, "avg t": 0.9219545100176776, "plain loss": 0.08809391453531051, "standard loss": 0.06092088587416543}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.1500015258789, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.83333587646484, "Augmented-Accuracy": 99.14066666666666, "Augmented-Loss": 0.06628805270234744, "Clean-Accuracy": 99.2, "Clean-Loss": 0.05022064266602198, "PGD-Accuracy": 1.4666666666666666, "PGD-Loss": 6.022600306193034}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 136, "Epoch-Time": 105.5512318611145, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.82999420166016, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.73999786376953, "Augmented-Accuracy": 99.2045, "Augmented-Loss": 0.0696843737807274, "Clean-Accuracy": 99.29, "Clean-Loss": 0.050073739182949065, "PGD-Accuracy": 1.51, "PGD-Loss": 6.041196115112305}, "Total-Time": 30966.448496341705, "Train": {"Loss": 0.9378241311532479, "avg t": 0.921959275563558, "plain loss": 0.08983451724582249, "standard loss": 0.06234088325058972}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.19999694824219, "Augmented-0.05-Quantile-Accuracy": 98.56666564941406, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.17, "Augmented-Loss": 0.06579843673586845, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.04853667637705803, "PGD-Accuracy": 1.6, "PGD-Loss": 6.0585012563069665}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 137, "Epoch-Time": 105.32648873329163, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.87999725341797, "Augmented-0.05-Quantile-Accuracy": 98.50999450683594, "Augmented-0.1-Quantile-Accuracy": 98.68999481201172, "Augmented-Accuracy": 99.2035, "Augmented-Loss": 0.06682947631442547, "Clean-Accuracy": 99.31, "Clean-Loss": 0.04830189927816391, "PGD-Accuracy": 1.45, "PGD-Loss": 5.794079058837891}, "Total-Time": 31071.774985074997, "Train": {"Loss": 0.9378718558064213, "avg t": 0.9219630353715684, "plain loss": 0.09030529901010018, "standard loss": 0.06223689987482848}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.21666717529297, "Augmented-0.05-Quantile-Accuracy": 98.69999694824219, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.207, "Augmented-Loss": 0.06405032311975956, "Clean-Accuracy": 99.28333333333333, "Clean-Loss": 0.04782156784335772, "PGD-Accuracy": 1.5333333333333334, "PGD-Loss": 5.781679987589518}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 138, "Epoch-Time": 105.74968647956848, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.0199966430664, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.80999755859375, "Augmented-Accuracy": 99.2518, "Augmented-Loss": 0.06796235612213612, "Clean-Accuracy": 99.31, "Clean-Loss": 0.049692464578151706, "PGD-Accuracy": 1.64, "PGD-Loss": 5.8309047943115235}, "Total-Time": 31177.524671554565, "Train": {"Loss": 0.9378355781413891, "avg t": 0.9219519350440414, "plain loss": 0.09099283986974648, "standard loss": 0.06301530396938324}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.29999542236328, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.76666259765625, "Augmented-Accuracy": 99.23066666666666, "Augmented-Loss": 0.06497615258594354, "Clean-Accuracy": 99.36666666666666, "Clean-Loss": 0.04864655533432961, "PGD-Accuracy": 1.9166666666666667, "PGD-Loss": 5.763423746744792}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 139, "Epoch-Time": 105.80484819412231, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.88999938964844, "Augmented-0.05-Quantile-Accuracy": 98.52999877929688, "Augmented-0.1-Quantile-Accuracy": 98.72999572753906, "Augmented-Accuracy": 99.1693, "Augmented-Loss": 0.06634492589819431, "Clean-Accuracy": 99.26, "Clean-Loss": 0.0488017883002758, "PGD-Accuracy": 1.8, "PGD-Loss": 5.735050183105469}, "Total-Time": 31283.329519748688, "Train": {"Loss": 0.9377934755572567, "avg t": 0.9219521762706615, "plain loss": 0.089660203633485, "standard loss": 0.061600885943130214}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.13333129882812, "Augmented-0.05-Quantile-Accuracy": 98.6500015258789, "Augmented-0.1-Quantile-Accuracy": 98.83333587646484, "Augmented-Accuracy": 99.16683333333333, "Augmented-Loss": 0.062752302215, "Clean-Accuracy": 99.2, "Clean-Loss": 0.04742803031206131, "PGD-Accuracy": 1.8833333333333333, "PGD-Loss": 5.675941650390625}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 140, "Epoch-Time": 105.44021320343018, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.98999786376953, "Augmented-0.05-Quantile-Accuracy": 98.66999816894531, "Augmented-0.1-Quantile-Accuracy": 98.86000061035156, "Augmented-Accuracy": 99.2442, "Augmented-Loss": 0.06301985898673534, "Clean-Accuracy": 99.3, "Clean-Loss": 0.04539037853479386, "PGD-Accuracy": 1.39, "PGD-Loss": 5.890847998046875}, "Total-Time": 31388.769732952118, "Train": {"Loss": 0.9378287760416667, "avg t": 0.9219579524287471, "plain loss": 0.08602742580661075, "standard loss": 0.059104336935060994}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.33333587646484, "Augmented-0.05-Quantile-Accuracy": 98.78333282470703, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.23433333333334, "Augmented-Loss": 0.05978244534214338, "Clean-Accuracy": 99.3, "Clean-Loss": 0.04426893763740857, "PGD-Accuracy": 1.6833333333333333, "PGD-Loss": 5.824365580240886}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 141, "Epoch-Time": 105.06299042701721, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.97000122070312, "Augmented-0.05-Quantile-Accuracy": 98.47000122070312, "Augmented-0.1-Quantile-Accuracy": 98.75, "Augmented-Accuracy": 99.1691, "Augmented-Loss": 0.0691321338160038, "Clean-Accuracy": 99.26, "Clean-Loss": 0.04972245703339577, "PGD-Accuracy": 1.95, "PGD-Loss": 5.774964184570313}, "Total-Time": 31493.832723379135, "Train": {"Loss": 0.9378114452715274, "avg t": 0.9219573541570593, "plain loss": 0.0904926670445337, "standard loss": 0.06205969202739221}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.31666564941406, "Augmented-0.05-Quantile-Accuracy": 98.63333129882812, "Augmented-0.1-Quantile-Accuracy": 98.86666870117188, "Augmented-Accuracy": 99.18, "Augmented-Loss": 0.06597812155465285, "Clean-Accuracy": 99.2, "Clean-Loss": 0.048853875974814095, "PGD-Accuracy": 1.9166666666666667, "PGD-Loss": 5.7613669230143225}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 142, "Epoch-Time": 106.76589393615723, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.79999542236328, "Augmented-0.05-Quantile-Accuracy": 98.45999908447266, "Augmented-0.1-Quantile-Accuracy": 98.69999694824219, "Augmented-Accuracy": 99.188, "Augmented-Loss": 0.08001094597291947, "Clean-Accuracy": 99.28, "Clean-Loss": 0.058183907389640806, "PGD-Accuracy": 1.63, "PGD-Loss": 5.643444830322266}, "Total-Time": 31600.598617315292, "Train": {"Loss": 0.9378872077553361, "avg t": 0.9219620038491708, "plain loss": 0.09471689458069976, "standard loss": 0.06548660672814757}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.0999984741211, "Augmented-0.05-Quantile-Accuracy": 98.5999984741211, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.22666666666667, "Augmented-Loss": 0.07476948326528073, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.05530331136782964, "PGD-Accuracy": 1.9833333333333334, "PGD-Loss": 5.526431681315104}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 143, "Epoch-Time": 106.33626747131348, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.00999450683594, "Augmented-0.05-Quantile-Accuracy": 98.44999694824219, "Augmented-0.1-Quantile-Accuracy": 98.72000122070312, "Augmented-Accuracy": 99.2314, "Augmented-Loss": 0.07077062035608292, "Clean-Accuracy": 99.27, "Clean-Loss": 0.050583244776725766, "PGD-Accuracy": 1.62, "PGD-Loss": 5.7218405059814454}, "Total-Time": 31706.934884786606, "Train": {"Loss": 0.9378616866359004, "avg t": 0.9219558708049633, "plain loss": 0.09209026137457953, "standard loss": 0.06420311201501776}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.26666259765625, "Augmented-0.05-Quantile-Accuracy": 98.75, "Augmented-0.1-Quantile-Accuracy": 98.93333435058594, "Augmented-Accuracy": 99.28016666666667, "Augmented-Loss": 0.06632509362121423, "Clean-Accuracy": 99.38333333333334, "Clean-Loss": 0.048411727219820025, "PGD-Accuracy": 1.9166666666666667, "PGD-Loss": 5.652972918192545}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 144, "Epoch-Time": 105.23447012901306, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.97999572753906, "Augmented-0.05-Quantile-Accuracy": 98.55999755859375, "Augmented-0.1-Quantile-Accuracy": 98.79000091552734, "Augmented-Accuracy": 99.223, "Augmented-Loss": 0.0720354536254406, "Clean-Accuracy": 99.34, "Clean-Loss": 0.051643535268306735, "PGD-Accuracy": 1.41, "PGD-Loss": 5.8315817016601565}, "Total-Time": 31812.16935491562, "Train": {"Loss": 0.9378369065390693, "avg t": 0.9219588214732982, "plain loss": 0.09225918345981168, "standard loss": 0.06362583013154842}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.3499984741211, "Augmented-0.05-Quantile-Accuracy": 98.79999542236328, "Augmented-0.1-Quantile-Accuracy": 98.93333435058594, "Augmented-Accuracy": 99.21366666666667, "Augmented-Loss": 0.06854098613580067, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.050387765010197955, "PGD-Accuracy": 1.6, "PGD-Loss": 5.746067759195964}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 145, "Epoch-Time": 105.04575538635254, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.04000091552734, "Augmented-0.05-Quantile-Accuracy": 98.52999877929688, "Augmented-0.1-Quantile-Accuracy": 98.70999908447266, "Augmented-Accuracy": 99.207, "Augmented-Loss": 0.0637737633023262, "Clean-Accuracy": 99.31, "Clean-Loss": 0.0464686331152916, "PGD-Accuracy": 1.59, "PGD-Loss": 6.004141363525391}, "Total-Time": 31917.21511030197, "Train": {"Loss": 0.9378658014403449, "avg t": 0.9219641150015372, "plain loss": 0.08989875305670272, "standard loss": 0.062322695072050446}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.26666259765625, "Augmented-0.05-Quantile-Accuracy": 98.63333129882812, "Augmented-0.1-Quantile-Accuracy": 98.78333282470703, "Augmented-Accuracy": 99.18966666666667, "Augmented-Loss": 0.0609928826679786, "Clean-Accuracy": 99.23333333333333, "Clean-Loss": 0.04590840723613898, "PGD-Accuracy": 2.05, "PGD-Loss": 5.903400583902995}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 146, "Epoch-Time": 106.7180724143982, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.06999969482422, "Augmented-0.05-Quantile-Accuracy": 98.6199951171875, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.2474, "Augmented-Loss": 0.06788082689046859, "Clean-Accuracy": 99.33, "Clean-Loss": 0.0486509948849678, "PGD-Accuracy": 1.26, "PGD-Loss": 6.048602014160156}, "Total-Time": 32023.93318271637, "Train": {"Loss": 0.9378116337811505, "avg t": 0.9219551269036752, "plain loss": 0.08825116800025666, "standard loss": 0.06074446371087321}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.29999542236328, "Augmented-0.05-Quantile-Accuracy": 98.81666564941406, "Augmented-0.1-Quantile-Accuracy": 98.94999694824219, "Augmented-Accuracy": 99.25633333333333, "Augmented-Loss": 0.06464364696204662, "Clean-Accuracy": 99.31666666666666, "Clean-Loss": 0.047379559884468715, "PGD-Accuracy": 1.4666666666666666, "PGD-Loss": 6.009472152709961}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 147, "Epoch-Time": 107.52967977523804, "Test": {"Augmented-0.01-Quantile-Accuracy": 98.08999633789062, "Augmented-0.05-Quantile-Accuracy": 98.61000061035156, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.2429, "Augmented-Loss": 0.0633277208930254, "Clean-Accuracy": 99.36, "Clean-Loss": 0.044909353053569794, "PGD-Accuracy": 1.07, "PGD-Loss": 6.092453524780273}, "Total-Time": 32131.462862491608, "Train": {"Loss": 0.9378556431664361, "avg t": 0.9219593515042905, "plain loss": 0.08641212455608217, "standard loss": 0.06025033344383593}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.3499984741211, "Augmented-0.05-Quantile-Accuracy": 98.76666259765625, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.27383333333333, "Augmented-Loss": 0.06010146706342697, "Clean-Accuracy": 99.38333333333334, "Clean-Loss": 0.04350526609023412, "PGD-Accuracy": 1.05, "PGD-Loss": 6.03518158976237}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 148, "Epoch-Time": 106.24145936965942, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.97000122070312, "Augmented-0.05-Quantile-Accuracy": 98.61000061035156, "Augmented-0.1-Quantile-Accuracy": 98.79999542236328, "Augmented-Accuracy": 99.2614, "Augmented-Loss": 0.06700670507645606, "Clean-Accuracy": 99.38, "Clean-Loss": 0.04775641129016876, "PGD-Accuracy": 1.63, "PGD-Loss": 5.600126193237305}, "Total-Time": 32237.704321861267, "Train": {"Loss": 0.9378806522863883, "avg t": 0.9219622259493228, "plain loss": 0.09017894479080481, "standard loss": 0.06057870475009636}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.38333129882812, "Augmented-0.05-Quantile-Accuracy": 98.73332977294922, "Augmented-0.1-Quantile-Accuracy": 98.91666412353516, "Augmented-Accuracy": 99.269, "Augmented-Loss": 0.06311203807810942, "Clean-Accuracy": 99.36666666666666, "Clean-Loss": 0.046060689995686216, "PGD-Accuracy": 1.7666666666666666, "PGD-Loss": 5.575774663289388}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
{"Epoch": 149, "Epoch-Time": 70.44163250923157, "Test": {"Augmented-0.01-Quantile-Accuracy": 97.81999969482422, "Augmented-0.05-Quantile-Accuracy": 98.57999420166016, "Augmented-0.1-Quantile-Accuracy": 98.73999786376953, "Augmented-Accuracy": 99.2074, "Augmented-Loss": 0.06760171625757218, "Clean-Accuracy": 99.3, "Clean-Loss": 0.04790483803749084, "PGD-Accuracy": 1.83, "PGD-Loss": 5.714683831787109}, "Total-Time": 32308.1459543705, "Train": {"Loss": 0.9378560078232376, "avg t": 0.9219542881294533, "plain loss": 0.09039122071795987, "standard loss": 0.060939735801131635}, "Validation": {"Augmented-0.01-Quantile-Accuracy": 98.21666717529297, "Augmented-0.05-Quantile-Accuracy": 98.69999694824219, "Augmented-0.1-Quantile-Accuracy": 98.94999694824219, "Augmented-Accuracy": 99.23333333333333, "Augmented-Loss": 0.0632182778546214, "Clean-Accuracy": 99.3, "Clean-Loss": 0.04566162308057149, "PGD-Accuracy": 1.9666666666666666, "PGD-Loss": 5.632088521321615}, "args": {"algorithm": "CVaR_Modified_SGD", "batch_size": null, "cvar_sgd_M": null, "cvar_sgd_beta": 0.5, "cvar_sgd_t_step_size": 1.0, "data_dir": "./advbench/data", "dataset": "MNIST", "device": "cuda:0", "epsilon": null, "evaluators": ["Clean", "PGD", "Augmented"], "hparams": null, "hparams_seed": 0, "learning_rate": null, "model": null, "output_dir": "rep_five/mnist_mod_050", "save_model_every_epoch": false, "seed": 0, "trial_seed": 0}, "hparams": {"batch_size": 64, "cvar_sgd_M": 20, "cvar_sgd_beta": 0.5, "cvar_sgd_n_steps": 5, "cvar_sgd_t_step_size": 1.0, "epsilon": 0.3, "g_dale_n_steps": 7, "g_dale_noise_coeff": 0.001, "g_dale_nu": 0.1, "g_dale_pd_margin": 0.1, "g_dale_pd_step_size": 0.001, "g_dale_step_size": 0.1, "l_dale_n_steps": 7, "l_dale_noise_coeff": 0.001, "l_dale_nu": 0.1, "l_dale_step_size": 0.1, "learning_rate": 1.0, "mart_beta": 5.0, "optimizer": 0, "pgd_n_steps": 7, "pgd_step_size": 0.1, "rand_smoothing_n_samples": 10, "rand_smoothing_n_steps": 7, "rand_smoothing_sigma": 0.5, "rand_smoothing_step_size": 0.1, "term_t": 2.0, "trades_beta": 1.0, "trades_n_steps": 7, "trades_step_size": 0.1}}
