Metrics/EpRet,Metrics/EpCost,Metrics/EpLen,Train/Epoch,Train/Entropy,Train/KL,Train/StopIter,Train/PolicyRatio,Train/LR,Train/PolicyStd,TotalEnvSteps,Loss/Loss_pi,Loss/Loss_pi/Delta,Value/Adv,Loss/Loss_reward_critic,Loss/Loss_reward_critic/Delta,Value/reward,Time/Total,Time/Rollout,Time/Update,Time/Epoch,Time/FPS
-178.79351806640625,0.2800000011920929,55.119998931884766,0.0,1.4139022827148438,0.03477708250284195,3.0,0.995556652545929,0.0001500000071246177,0.994982898235321,2048.0,-0.0314510278403759,-0.0314510278403759,-0.12468741834163666,2110.103759765625,2110.103759765625,-0.14448364078998566,4.811440944671631,4.10282039642334,0.7073924541473389,4.810637474060059,425.72332763671875
-179.4430389404297,0.35483869910240173,56.0,1.0,1.4029006958007812,0.027002619579434395,5.0,0.9962325096130371,0.0,0.9841020703315735,4096.0,-0.028531571850180626,0.0029194559901952744,-0.23381422460079193,2087.865966796875,-22.23779296875,-1.619920253753662,10.351533889770508,4.4213104248046875,1.0958952903747559,5.517416954040527,371.18829345703125
