Time	Iteration	AverageReward	StdRewards	MaxRewardRollout	MinRewardRollout	timesteps	gradnorms	maxnorms
10.080000400543213	0	-0.3498906868886691	0.6482505264815465	1.0967403771370912	-1.8064589863235274	0	0.0	0
93.8617422580719	10	-0.19991174106893425	0.7338130305402482	1.8237893303599195	-2.108518119498436	2400000	0.909090909090909	0.09901475429766744
176.39925336837769	20	1172.8322012420158	46.244731425161056	1219.0303669644054	1080.6053216815926	4800000	0.9523809523809522	0.09901475429766744
257.74491333961487	30	2199.3719284350836	13.88311812110414	2228.8445254880935	2145.7929251259193	7200000	0.9677419354838709	0.09901475429766744
337.6819052696228	40	2263.047655008557	24.176771837284793	2311.2021729662083	2199.5219673578395	9600000	0.9756097560975608	0.09901475429766744
417.7592263221741	50	2097.6978807062	254.004036663635	2212.3783843666315	169.29343294736464	12000000	0.980392156862745	0.09901475429766744
497.86663699150085	60	2266.112467184388	143.8645658774255	2328.1862239688635	852.4207168139365	14400000	0.983606557377049	0.09901475429766744
578.2599608898163	70	2313.541182554351	19.185240656958733	2358.1161210192367	2257.162448538351	16800000	0.9859154929577463	0.09901475429766744
658.3343255519867	80	2300.6061676979375	25.088271666270497	2357.034910337068	2189.4490164313465	19200000	0.9876543209876542	0.09901475429766744
737.5059659481049	90	2405.6398175874865	28.370079860816716	2465.574371576309	2331.9565918724984	21600000	0.9890109890109888	0.09901475429766744
815.8199417591095	100	2485.8793741995573	19.869576223646323	2525.432076444122	2414.0034196353517	24000000	0.99009900990099	0.09901475429766744
893.1794672012329	110	2350.9918571489475	189.17617265339902	2422.7704461067915	486.5224049910903	26400000	0.9909909909909909	0.09901475429766744
971.0440831184387	120	2681.314798711211	349.36557735925146	2802.340538226068	202.07293854959426	28800000	0.9917355371900826	0.09901475429766744
1049.2757098674774	130	2315.467592212241	20.3139052129866	2374.287958937697	2256.73316986009	31200000	0.9923664122137402	0.09901475429766744
1125.4127144813538	140	2356.806887079376	433.86398701855524	2474.547016062308	-194.51031529229112	33600000	0.9929078014184395	0.09901475429766744
1202.7461190223694	150	2623.593802919304	124.82818219670848	2684.825140872039	1397.7329913840804	36000000	0.9933774834437085	0.09901475429766744
1280.2172627449036	160	2643.778969834994	24.13881841428738	2688.2949518542737	2565.3823470957577	38400000	0.9937888198757763	0.09901475429766744
1358.4599792957306	170	2813.575758607522	25.197357255654804	2875.7578401379287	2745.7526702089235	40800000	0.9941520467836256	0.09901475429766744
1436.1875615119934	180	2637.741700545852	178.9014802530799	2737.3944444609806	883.7335408055224	43200000	0.9944751381215468	0.09901475429766744
1515.699509859085	190	2717.6253289234674	26.279570443542774	2774.2164091579616	2658.1122207927983	45600000	0.994764397905759	0.09901475429766744
1592.9754745960236	200	2860.1221399507335	23.247132706700633	2909.1654779752716	2807.452522849664	48000000	0.9950248756218905	0.09901475429766744
