epoch,eval/num paths total,eval/num steps total,expl/Actions Max,expl/Actions Mean,expl/Actions Min,expl/Actions Std,expl/Average Returns,expl/Num Paths,expl/Returns Max,expl/Returns Mean,expl/Returns Min,expl/Returns Std,expl/Rewards Max,expl/Rewards Mean,expl/Rewards Min,expl/Rewards Std,expl/num paths total,expl/num steps total,expl/path length Max,expl/path length Mean,expl/path length Min,expl/path length Std,replay_buffer/size,time/epoch_time (s),time/evaluation sampling (s),time/exploration sampling (s),time/global_time (s),time/replay buffer data storing (s),time/saving (s),time/training (s),trainer/Advantage Score Max,trainer/Advantage Score Mean,trainer/Advantage Score Min,trainer/Advantage Score Std,trainer/Advantage Weights Max,trainer/Advantage Weights Mean,trainer/Advantage Weights Min,trainer/Advantage Weights Std,trainer/Policy Loss,trainer/Q Targets Max,trainer/Q Targets Mean,trainer/Q Targets Min,trainer/Q Targets Std,trainer/Q1 Predictions Max,trainer/Q1 Predictions Mean,trainer/Q1 Predictions Min,trainer/Q1 Predictions Std,trainer/Q2 Predictions Max,trainer/Q2 Predictions Mean,trainer/Q2 Predictions Min,trainer/Q2 Predictions Std,trainer/QF1 Loss,trainer/QF2 Loss,trainer/V1 Predictions Max,trainer/V1 Predictions Mean,trainer/V1 Predictions Min,trainer/V1 Predictions Std,trainer/VF Loss,trainer/num train calls,trainer/policy/mean Max,trainer/policy/mean Mean,trainer/policy/mean Min,trainer/policy/mean Std,trainer/policy/std Max,trainer/policy/std Mean,trainer/policy/std Min,trainer/policy/std Std,trainer/replay_buffer_len,trainer/rewards Max,trainer/rewards Mean,trainer/rewards Min,trainer/rewards Std,trainer/terminals Max,trainer/terminals Mean,trainer/terminals Min,trainer/terminals Std
-2,0,0,0.13717124,0.03626487,-0.049319427,0.045948837,-0.19655459402248504,1,-0.19655459402248504,-0.19655459402248504,-0.19655459402248504,0.0,-0.09325349516403507,-0.09827729701124252,-0.10330109885844999,0.005023801847207458,1,2,2,2.0,2,0.0,998999,0.7535736560821533,0.01971721649169922,0.0017578601837158203,20.90360975265503,2.384185791015625e-06,0.008637666702270508,0.7226138114929199,-0.0036168185,-0.008904904,-0.01419299,0.005288086,0.9892082,0.9737615,0.9583148,0.0154467225,857.7699,1.0095485,0.91235673,0.8151649,0.09719181,-3.695485e-05,-0.0023042315,-0.004571508,0.0022672766,0.0,0.0,0.0,0.0,0.8464968,0.84184104,0.01419299,0.007483647,0.0007743044,0.006709343,3.2178352e-05,100,0.004211932,0.0006116896,-0.0027325656,0.0019366256,0.049787067,0.049787063,0.049787067,3.7252903e-09,998999,1.0072821,0.90650094,0.80571973,0.1007812,0.0,0.0,0.0,0.0
-1,0,0,0.049955986,-0.051808134,-0.24854904,0.08398724,0.4338117202694962,1,0.4338117202694962,0.4338117202694962,0.4338117202694962,0.0,0.24300404877931653,0.2169058601347481,0.19080767149017966,0.026098188644568435,2,4,2,2.0,2,0.0,998999,0.6934354305267334,0.0024938583374023438,0.002553224563598633,21.599952220916748,1.9073486328125e-06,0.00806879997253418,0.6797149181365967,-0.004432007,-0.0058829254,-0.0073338435,0.0014509181,0.98679197,0.98251534,0.97823876,0.0042766035,440.564,1.0878772,0.8795528,0.6712284,0.20832437,0.07119025,0.055561554,0.039932854,0.0156287,0.06366714,0.046736993,0.029806845,0.016930148,0.7160932,0.7302138,0.013697105,0.0122417575,0.0107864095,0.001455348,1.1014193e-05,200,-0.17424563,-0.48487774,-0.8831331,0.2023349,0.051678017,0.05148844,0.051258426,0.00012519717,998999,1.0813023,0.8714981,0.661694,0.20980415,0.0,0.0,0.0,0.0
0,0,0,0.12498924,-0.07945812,-0.43564224,0.1438326,-0.22196420100855407,1,-0.22196420100855407,-0.22196420100855407,-0.22196420100855407,0.0,-0.06626331815569395,-0.11098210050427704,-0.15570088285286013,0.04471878234858309,4,8,2,2.0,2,0.0,999003,0.6045346260070801,0.0011963844299316406,0.0011255741119384766,22.207528352737427,3.814697265625e-05,0.010853290557861328,0.5892090797424316,-0.0010308158,-0.0048863282,-0.008741841,0.0038555125,0.9969123,0.9855138,0.9741154,0.011398464,180.96556,0.9284907,0.8786598,0.8288289,0.049830914,0.1675013,0.12049564,0.07348998,0.04700566,0.06015433,0.059967212,0.0597801,0.00018711574,0.5748209,0.67272204,0.030508472,0.026754959,0.023001445,0.003753513,1.1622354e-05,300,0.3537424,-0.43678454,-0.9513559,0.35695845,0.053244345,0.052891567,0.05234169,0.0002728698,999003,0.91071784,0.85639596,0.80207413,0.054321855,0.0,0.0,0.0,0.0
1,0,0,0.11573008,-0.044602025,-0.21003142,0.09092906,-0.10424991824240865,1,-0.10424991824240865,-0.10424991824240865,-0.10424991824240865,0.0,-0.010003530794350048,-0.05212495912120432,-0.0942463874480586,0.04212142832685428,5,10,2,2.0,2,0.0,999005,0.6860871315002441,0.0013425350189208984,0.0012538433074951172,22.896247386932373,3.790855407714844e-05,0.007896184921264648,0.6749513149261475,0.004231114,0.0035969168,0.0029627196,0.00063419715,1.0127742,1.010851,1.0089278,0.0019232035,123.68506,0.8583293,0.8315314,0.80473346,0.02679792,0.33825877,0.21806143,0.097864084,0.12019734,0.09187969,0.089366615,0.086853534,0.002513077,0.39795297,0.5513983,0.040352434,0.039215915,0.038079392,0.0011365209,9.338011e-06,400,0.40095848,-0.35091817,-0.9745383,0.52953124,0.054846372,0.054164585,0.053079303,0.00054456014,999005,0.81591684,0.78952396,0.7631311,0.026392877,0.0,0.0,0.0,0.0
