step,reward
0.0,-8.272988319396973
100000.0,-8.272988319396973
200000.0,-8.272988319396973
300000.0,-9.078031539916992
400000.0,-9.078031539916992
500000.0,-6.400168895721436
600000.0,-5.0646328926086435
700000.0,-5.0646328926086435
800000.0,-4.2675089836120605
900000.0,-4.2675089836120605
1000000.0,-3.728973388671875
1100000.0,-3.3485732078552246
1200000.0,-3.3485732078552246
1300000.0,-3.057378053665161
1400000.0,-2.8364896774291988
1500000.0,-2.8364896774291988
1600000.0,-2.653902530670166
1700000.0,-2.653902530670166
1800000.0,-3.1052088737487797
1900000.0,-2.929795265197754
2000000.0,-2.929795265197754
2100000.0,-2.7872185707092285
2200000.0,-2.7872185707092285
2300000.0,-2.6601595878601074
2400000.0,-2.55236291885376
2500000.0,-2.55236291885376
2600000.0,-2.456019401550293
2700000.0,-2.370429277420044
2800000.0,-2.370429277420044
2900000.0,-2.2948977947235107
3000000.0,-2.2948977947235107
3100000.0,-2.226745367050171
3200000.0,-2.165840148925781
3300000.0,-2.165840148925781
3400000.0,-1.8021907806396484
3500000.0,-1.358604907989502
3600000.0,-1.358604907989502
3700000.0,-1.3563950061798096
3800000.0,-1.3563950061798096
3900000.0,-1.354271650314331
4000000.0,-1.3503950834274292
4100000.0,-1.3503950834274292
4200000.0,-1.3493579626083374
4300000.0,-1.3493579626083374
4400000.0,-1.346049427986145
4500000.0,-1.345938205718994
4600000.0,-1.345938205718994
4700000.0,-1.3424690961837769
4800000.0,-1.343024730682373
4900000.0,-1.343024730682373
5000000.0,-1.0121234655380251
5100000.0,-1.0121234655380251
5200000.0,-1.014320969581604
5300000.0,-1.0104018449783323
5400000.0,-1.0104018449783323
5500000.0,-1.0376610755920408
5600000.0,-1.0376610755920408
5700000.0,-1.03556227684021
5800000.0,-1.0359573364257812
5900000.0,-1.0359573364257812
6000000.0,-1.0359573364257812
6100000.0,-1.0367105007171629
6200000.0,-1.0367105007171629
6300000.0,-1.036833882331848
6400000.0,-1.036833882331848
6500000.0,-1.0373153686523438
6600000.0,-1.0374017953872678
6700000.0,-1.0374017953872678
6800000.0,-1.0375375747680664
6900000.0,-1.0378339290618896
7000000.0,-1.0378339290618896
7100000.0,-1.0376734733581543
7200000.0,-1.0376734733581543
7300000.0,-1.0384635925292969
7400000.0,-1.0383524894714355
7500000.0,-1.0383524894714355
7600000.0,-1.0393401384353638
7700000.0,-1.0393401384353638
7800000.0,-1.0390437841415403
7900000.0,-1.0400807857513428
8000000.0,-1.0400807857513428
8100000.0,-1.0395623445510864
8200000.0,-1.0409573316574097
8300000.0,-1.0409573316574097
8400000.0,-1.0393648147583008
8500000.0,-1.0393648147583008
8600000.0,-1.0408147573471072
8700000.0,-1.0136666297912598
8800000.0,-1.0136666297912598
8900000.0,-1.0147531032562256
9000000.0,-1.0147531032562256
9100000.0,-1.0144814252853394
9200000.0,-1.0171852111816406
9300000.0,-1.0171852111816406
9400000.0,-1.0163209438323977
9500000.0,-1.055135726928711
9600000.0,-1.055135726928711
9700000.0,-1.0546419620513916
9800000.0,-1.0546419620513916
9900000.0,-1.0584814548492432
