rf_loss,log-pi-max,alpha-avg,episode-length-avg,pool-size,mean-sq-bellman-error1,qf2-std,time-train,last-path-return,mean-sq-bellman-error2,episode-length-max,log-sigs-min,return-average,time-total,qf1-std,avg-path-return,log-pi-min,episodes,log-pi-std,log-pi-mean,total-samples,return-max,policy-mus-max,time-sample,rf_q-std,rf_pi-std,div-avg,log-sigs-mean,episode-length-std,vf-avg,qf2-avg,log-sigs-std,vf-std,log-sigs-max,rf_q-avg,episode-length-min,policy-mus-std,epoch,qf1-avg,alpha-std,mean-qf-diff,policy-mus-min,time-eval,policy-mus-mean,return-min,rf_pi-avg,max-path-return,return-std
0.048912,-0.491318,0.697215,1000.0,1000,0.682164,0.442067,0.3731979699805379,0.0,1.00841,1000,-3.11804,0.0,1.415129104629159,0.442067,0.0,-14.7734,1,2.2928,-6.73352,1000,0.0,1.9594,0.1744159096851945,0.106252,0.106099,-0.0489119,-0.289727,0.0,-0.245077,-0.0718279,0.648345,0.509356,1.80905,0.689019,1000,0.640447,0,-0.0718279,0.06073,0.797232,-2.76867,0,-0.331193,0.0,0.685908,0.0,0.0
