epoch,eval/num paths total,eval/num steps total,expl/Actions Max,expl/Actions Mean,expl/Actions Min,expl/Actions Std,expl/Average Returns,expl/Num Paths,expl/Returns Max,expl/Returns Mean,expl/Returns Min,expl/Returns Std,expl/Rewards Max,expl/Rewards Mean,expl/Rewards Min,expl/Rewards Std,expl/num paths total,expl/num steps total,expl/path length Max,expl/path length Mean,expl/path length Min,expl/path length Std,replay_buffer/size,time/epoch_time (s),time/evaluation sampling (s),time/exploration sampling (s),time/global_time (s),time/replay buffer data storing (s),time/saving (s),time/training (s),trainer/Advantage Score Max,trainer/Advantage Score Mean,trainer/Advantage Score Min,trainer/Advantage Score Std,trainer/Advantage Weights Max,trainer/Advantage Weights Mean,trainer/Advantage Weights Min,trainer/Advantage Weights Std,trainer/Policy Loss,trainer/Q Targets Max,trainer/Q Targets Mean,trainer/Q Targets Min,trainer/Q Targets Std,trainer/Q1 Predictions Max,trainer/Q1 Predictions Mean,trainer/Q1 Predictions Min,trainer/Q1 Predictions Std,trainer/Q2 Predictions Max,trainer/Q2 Predictions Mean,trainer/Q2 Predictions Min,trainer/Q2 Predictions Std,trainer/QF1 Loss,trainer/QF2 Loss,trainer/V1 Predictions Max,trainer/V1 Predictions Mean,trainer/V1 Predictions Min,trainer/V1 Predictions Std,trainer/VF Loss,trainer/num train calls,trainer/policy/mean Max,trainer/policy/mean Mean,trainer/policy/mean Min,trainer/policy/mean Std,trainer/policy/std Max,trainer/policy/std Mean,trainer/policy/std Min,trainer/policy/std Std,trainer/replay_buffer_len,trainer/rewards Max,trainer/rewards Mean,trainer/rewards Min,trainer/rewards Std,trainer/terminals Max,trainer/terminals Mean,trainer/terminals Min,trainer/terminals Std
-2,0,0,0.13717124,0.03626487,-0.049319427,0.045948837,-0.19655459402248504,1,-0.19655459402248504,-0.19655459402248504,-0.19655459402248504,0.0,-0.09325349516403507,-0.09827729701124252,-0.10330109885844999,0.005023801847207458,1,2,2,2.0,2,0.0,998999,0.7398281097412109,0.022743940353393555,0.0016701221466064453,20.234392166137695,1.9073486328125e-06,0.008835077285766602,0.7058250904083252,-0.0036168185,-0.008904904,-0.01419299,0.005288086,0.9892082,0.9737615,0.9583148,0.0154467225,857.7699,1.0095485,0.91235673,0.8151649,0.09719181,-3.695485e-05,-0.0023042315,-0.004571508,0.0022672766,0.0,0.0,0.0,0.0,0.8464968,0.84184104,0.01419299,0.007483647,0.0007743044,0.006709343,3.2178352e-05,100,0.004211932,0.0006116896,-0.0027325656,0.0019366256,0.049787067,0.049787063,0.049787067,3.7252903e-09,998999,1.0072821,0.90650094,0.80571973,0.1007812,0.0,0.0,0.0,0.0
-1,0,0,0.049955986,-0.051808134,-0.24854904,0.08398724,0.4338117202694962,1,0.4338117202694962,0.4338117202694962,0.4338117202694962,0.0,0.24300404877931653,0.2169058601347481,0.19080767149017966,0.026098188644568435,2,4,2,2.0,2,0.0,998999,0.6178200244903564,0.0024394989013671875,0.002116680145263672,20.855294704437256,1.6689300537109375e-06,0.008217334747314453,0.6044015884399414,-0.004432007,-0.0058829254,-0.0073338435,0.0014509181,0.98679197,0.98251534,0.97823876,0.0042766035,440.564,1.0878772,0.8795528,0.6712284,0.20832437,0.07119025,0.055561554,0.039932854,0.0156287,0.06366714,0.046736993,0.029806845,0.016930148,0.7160932,0.7302138,0.013697105,0.0122417575,0.0107864095,0.001455348,1.1014193e-05,200,-0.17424563,-0.48487774,-0.8831331,0.2023349,0.051678017,0.05148844,0.051258426,0.00012519717,998999,1.0813023,0.8714981,0.661694,0.20980415,0.0,0.0,0.0,0.0
