step,reward
0.0,-8.221975326538086
100000.0,-8.221975326538086
200000.0,-8.221975326538086
300000.0,-9.27554988861084
400000.0,-9.27554988861084
500000.0,-6.528637886047362
600000.0,-5.165244102478027
700000.0,-5.165244102478027
800000.0,-4.3412814140319815
900000.0,-4.3412814140319815
1000000.0,-3.794113159179688
1100000.0,-3.3985168933868413
1200000.0,-3.3985168933868413
1300000.0,-3.105924367904663
1400000.0,-2.8729479312896733
1500000.0,-2.8729479312896733
1600000.0,-2.692937135696411
1700000.0,-2.692937135696411
1800000.0,-2.540024757385254
1900000.0,-2.4794671535491943
2000000.0,-2.4794671535491943
2100000.0,-2.366174697875977
2200000.0,-2.366174697875977
2300000.0,-2.2725238800048833
2400000.0,-2.1882486343383794
2500000.0,-2.1882486343383794
2600000.0,-2.1165447235107417
2700000.0,-2.05133056640625
2800000.0,-2.05133056640625
2900000.0,-1.9929232597351076
3000000.0,-1.9929232597351076
3100000.0,-1.9410409927368164
3200000.0,-1.893988847732544
3300000.0,-1.893988847732544
3400000.0,-1.5333592891693115
3500000.0,-1.066927790641785
3600000.0,-1.066927790641785
3700000.0,-1.0658906698226929
3800000.0,-1.0658906698226929
3900000.0,-1.0622117519378662
4000000.0,-1.0607672929763794
4100000.0,-1.0607672929763794
4200000.0,-1.0578536987304688
4300000.0,-1.0578536987304688
4400000.0,-1.0574957132339478
4500000.0,-1.054606795310974
4600000.0,-1.054606795310974
4700000.0,-1.0550141334533691
4800000.0,-1.0514092445373535
4900000.0,-1.0514092445373535
5000000.0,-1.0524691343307495
5100000.0,-1.0524691343307495
5200000.0,-1.011839509010315
5300000.0,-1.6910988092422483
5400000.0,-1.6910988092422483
5500000.0,-1.6883456707000732
5600000.0,-1.6883456707000732
5700000.0,-1.6887900829315186
5800000.0,-1.6868271827697754
5900000.0,-1.6868271827697754
6000000.0,-1.6873457431793213
6100000.0,-1.687432050704956
6200000.0,-1.687432050704956
6300000.0,-1.6898148059844968
6400000.0,-1.6898148059844968
6500000.0,-1.6899876594543457
6600000.0,-1.690123438835144
6700000.0,-1.690123438835144
6800000.0,-1.6902592182159424
6900000.0,-1.69007408618927
7000000.0,-1.69007408618927
7100000.0,-1.690666675567627
7200000.0,-1.690666675567627
7300000.0,-1.6905062198638916
7400000.0,-1.6914197206497192
7500000.0,-1.6914197206497192
7600000.0,-1.6910246610641482
7700000.0,-1.6910246610641482
7800000.0,-1.6923826932907104
7900000.0,-1.692197561264038
8000000.0,-1.692197561264038
8100000.0,-1.6933085918426514
8200000.0,-1.692456841468811
8300000.0,-1.692456841468811
8400000.0,-1.6941604614257812
8500000.0,-1.6941604614257812
8600000.0,-1.0151481628417969
8700000.0,-1.0164937973022459
8800000.0,-1.0164937973022459
8900000.0,-1.0162838697433472
9000000.0,-1.0162838697433472
9100000.0,-1.0177778005599976
9200000.0,-1.017283916473389
9300000.0,-1.017283916473389
9400000.0,-1.0207036733627322
9500000.0,-1.0184073448181152
9600000.0,-1.0184073448181152
9700000.0,-1.0710493326187134
9800000.0,-1.0710493326187134
9900000.0,-1.070950627326965
