step,reward
40000,-195.9440460205078
80000,-180.01258850097656
120000,-157.58216857910156
160000,-122.20491790771484
200000,-103.43863677978516
240000,-100.63526916503906
280000,-71.69869995117188
320000,-64.31105041503906
360000,-74.0600357055664
400000,-75.29529571533203
440000,-73.69784545898438
480000,-67.62947082519531
520000,-77.39163208007812
560000,-47.03382110595703
600000,-21.613473892211914
640000,-34.777957916259766
680000,-51.35337448120117
720000,-61.158470153808594
760000,-36.000892639160156
800000,-18.835947036743164
840000,-23.21925163269043
880000,-28.95142936706543
920000,4.990861892700195
960000,12.229146957397461
1000000,-10.643450736999512
1040000,3.7378711700439453
1080000,10.028675079345703
1120000,-14.938220024108887
1160000,-11.253103256225586
1200000,-18.241344451904297
1240000,11.024599075317383
1280000,-18.72162437438965
1320000,-42.19297790527344
1360000,-1.8093689680099487
1400000,-17.611621856689453
1440000,-13.785252571105957
1480000,-3.269179105758667
1520000,18.93478775024414
1560000,-29.418127059936523
1600000,7.223623275756836
1640000,-43.689659118652344
1680000,4.978233814239502
1720000,-10.250267028808594
1760000,-34.65861129760742
1800000,0.8100723624229431
1840000,-15.178393363952637
1880000,-8.986491203308105
1920000,32.62478256225586
1960000,3.5723798274993896
2000000,46.855770111083984
