step,reward
0.0,-8.504481315612793
100000.0,-8.504481315612793
200000.0,-8.504481315612793
300000.0,-8.92434024810791
400000.0,-8.92434024810791
500000.0,-6.2947449684143075
600000.0,-4.983960151672363
700000.0,-4.983960151672363
800000.0,-4.196205139160156
900000.0,-4.196205139160156
1000000.0,-3.672228574752808
1100000.0,-3.337218761444092
1200000.0,-3.337218761444092
1300000.0,-3.0477824211120605
1400000.0,-2.824530839920044
1500000.0,-2.824530839920044
1600000.0,-2.6438310146331787
1700000.0,-2.6438310146331787
1800000.0,-2.497377157211304
1900000.0,-2.374797344207764
2000000.0,-2.374797344207764
2100000.0,-2.2714369297027592
2200000.0,-2.2714369297027592
2300000.0,-2.182365894317627
2400000.0,-2.1055662631988525
2500000.0,-2.1055662631988525
2600000.0,-2.0382740497589107
2700000.0,-1.9787530899047847
2800000.0,-1.9787530899047847
2900000.0,-1.926764726638794
3000000.0,-1.926764726638794
3100000.0,-1.8794171810150144
3200000.0,-2.1613721847534184
3300000.0,-2.1613721847534184
3400000.0,-1.7875926494598389
3500000.0,-1.7875926494598389
3600000.0,-1.3703826665878296
3700000.0,-1.3699506521224976
3800000.0,-1.3699506521224976
3900000.0,-1.367370367050171
4000000.0,-1.366493821144104
4100000.0,-1.366493821144104
4200000.0,-1.3638765811920166
4300000.0,-1.3638765811920166
4400000.0,-1.349123477935791
4500000.0,-1.3480370044708252
4600000.0,-1.3480370044708252
4700000.0,-1.3479382991790771
4800000.0,-1.3470617532730105
4900000.0,-1.3470617532730105
5000000.0,-1.348888874053955
5100000.0,-1.348888874053955
5200000.0,-1.3475679159164429
5300000.0,-1.350617289543152
5400000.0,-1.350617289543152
5500000.0,-1.348985195159912
5600000.0,-1.348985195159912
5700000.0,-1.3510839939117432
5800000.0,-1.3496395349502563
5900000.0,-1.3496395349502563
6000000.0,-1.3494173288345337
6100000.0,-1.3472691774368286
6200000.0,-1.3472691774368286
6300000.0,-1.3469605445861816
6400000.0,-1.3469605445861816
6500000.0,-1.0210345983505251
6600000.0,-1.0210715532302856
6700000.0,-1.0210715532302856
6800000.0,-1.0210715532302856
6900000.0,-1.0210715532302856
7000000.0,-1.0216271877288818
7100000.0,-1.0216271877288818
7200000.0,-1.0216271877288818
7300000.0,-1.0226271152496338
7400000.0,-1.0226271152496338
7500000.0,-1.0226271152496338
7600000.0,-1.023046851158142
7700000.0,-1.023046851158142
7800000.0,-1.023046851158142
7900000.0,-1.023614764213562
8000000.0,-1.023614764213562
8100000.0,-1.023614764213562
8200000.0,-1.0225160121917725
8300000.0,-1.0225160121917725
8400000.0,-1.0225160121917725
8500000.0,-1.0225160121917725
8600000.0,-1.020565390586853
8700000.0,-1.0209752321243286
8800000.0,-1.0209752321243286
8900000.0,-1.042678952217102
9000000.0,-1.042678952217102
9100000.0,-1.0394123792648315
9200000.0,-1.111375331878662
9300000.0,-1.111375331878662
9400000.0,-1.1079851388931274
9500000.0,-1.1069605350494385
9600000.0,-1.1069605350494385
9700000.0,-1.1069852113723757
9800000.0,-1.1069852113723757
9900000.0,-1.1055036783218384
