Metrics/EpRet,Metrics/EpCost,Metrics/EpLen,Train/Epoch,Train/Entropy,Train/KL,Train/StopIter,Train/PolicyRatio,Train/LR,Train/PolicyStd,TotalEnvSteps,Loss/Loss_pi,Loss/Loss_pi/Delta,Value/Adv,Loss/Loss_reward_critic,Loss/Loss_reward_critic/Delta,Value/reward,Time/Total,Time/Rollout,Time/Update,Time/Epoch,Time/FPS,Misc/Alpha,Misc/FinalStepNorm,Misc/gradient_norm,Misc/xHx,Misc/H_inv_g
-178.79351806640625,0.2800000011920929,55.119998931884766,0.0,1.378043293952942,0.0,10.0,0.9962406158447266,0.0,0.9600533843040466,2048.0,-0.08913429081439972,-0.08913429081439972,2.528540790081024e-07,1686.935546875,1686.935546875,-0.14448364078998566,5.198263168334961,4.091709136962891,1.1056640148162842,5.197443962097168,394.03997802734375,0.2244206666946411,0.33427420258522034,0.29370883107185364,0.39710402488708496,1.4894983768463135
-237.6625518798828,1.1515151262283325,78.1515121459961,1.0,1.3339864015579224,0.0,10.0,1.002729058265686,0.0,0.9186481833457947,4096.0,-0.09461010247468948,-0.005475811660289764,-1.3690441846847534e-07,1352.0322265625,-334.9033203125,-14.09510612487793,10.670058250427246,4.426172256469727,1.0115702152252197,5.437805652618408,376.62261962890625,0.22050604224205017,0.3292768597602844,0.30748632550239563,0.4113287031650543,1.4932781457901
