loss,margin,positive_reward,negative_reward,deterministic_return
0.0,0.0,0.0,0.0,2.626249569442986
-12255.7353515625,720.7276134490967,4219.286907553673,3498.559294104576,895.3296748982965
-16767.271484375,73.46349668502808,5738.304911136627,5664.841414451599,824.656640593302
-18108.94140625,38.514262199401855,6184.36563873291,6145.851376533508,466.91869084906455
-19014.3828125,29.461091995239258,6485.349184036255,6455.888092041016,689.5435945814974
-19636.49609375,19.21620464324951,6692.540105819702,6673.323901176453,1215.9218784698571
-20285.306640625,14.324013710021973,6908.7468938827515,6894.4228801727295,3025.1956754488283
-20868.224609375,22.845949172973633,7102.079367637634,7079.233418464661,1174.8798862767583
-21257.294921875,11.510273933410645,7231.977365493774,7220.467091560364,1644.9169175498175
-21651.798828125,10.382532119750977,7363.413599014282,7353.031066894531,966.4862361915845
-22120.60546875,14.047517776489258,7519.110057830811,7505.062540054321,933.6788381496501
-22211.83984375,2.186697006225586,7550.266260147095,7548.079563140869,1194.5348825811855
-22599.625,-3.988551139831543,7679.418901443481,7683.407452583313,983.5941466248779
-22796.615234375,-18.209155082702637,7745.577710151672,7763.786865234375,887.5523885267605
-23186.94921875,-10.700075149536133,7874.958689689636,7885.658764839172,884.8808424955856
-22617.453125,-65.9310891032219,7688.796514511108,7754.72760361433,886.0320059631701
-23672.4765625,-19.408906936645508,8036.986391067505,8056.39529800415,1025.0851643348697
-23889.60546875,-18.987034797668457,8109.063775062561,8128.0508098602295,2648.632406056887
-24089.29296875,-17.974703788757324,8175.545335769653,8193.52003955841,1495.0518507270194
-24168.12890625,-21.522132873535156,8202.179924964905,8223.70205783844,1334.7154332559826
-24478.61328125,-8.932072639465332,8304.734497070312,8313.666569709778,3419.850513225295
-24517.298828125,-15.20019817352295,8318.211835861206,8333.412034034729,2437.3642218005275
-24707.330078125,-17.250228881835938,8381.571864128113,8398.822093009949,1806.9019625458418
-24848.421875,-13.484633445739746,8428.403945922852,8441.888579368591,892.2665714220071
-24985.208984375,-17.659099578857422,8474.021381378174,8491.680480957031,422.4286618223298
-25014.263671875,-18.343796253204346,8483.925505161285,8502.26930141449,853.4915643434862
-24918.783203125,-54.563936829566956,8454.205844759941,8508.769781589508,969.7639903897472
-25493.755859375,-13.98228645324707,8643.395364761353,8657.3776512146,1489.1042740895443
-25526.91015625,-18.3917875289917,8654.484155654907,8672.875943183899,428.35265357440124
-25657.8984375,-26.923908233642578,8698.742835998535,8725.666744232178,1450.6099129406782
-25855.5234375,-1.5076475143432617,8763.117776870728,8764.62542438507,4407.277313984412
-25944.1015625,-22.678730010986328,8793.744908332825,8816.423638343811,3346.89811033757
-26165.046875,-15.943984985351562,8866.850952148438,8882.794937133789,3348.1395583590174
-26126.48828125,-20.413219451904297,8854.388370513916,8874.80158996582,881.1908187873755
-26275.009765625,-10.66858196258545,8903.386358261108,8914.054940223694,1273.1446264146198
-26213.765625,-23.681259155273438,8883.767007827759,8907.448266983032,862.7539046669605
-26018.09375,-50.20064967870712,8820.226152956486,8870.426802635193,954.9831193280143
-26534.771484375,-15.808156967163086,8989.945510864258,9005.75366783142,1278.2565817929496
-26553.119140625,-17.262990951538086,8996.559745788574,9013.822736740112,3141.7759826207716
-26510.7734375,-43.12429618835449,8983.591206550598,9026.715502738953,856.2652156343321
-26893.203125,-8.533574104309082,9109.220131874084,9117.753705978394,923.3625355454369
-26896.1796875,-9.62571907043457,9110.396492004395,9120.02221107483,1664.8784378624762
-26863.1953125,-15.520197868347168,9099.75726222992,9115.277460098267,855.4329645998075
-27019.90234375,-7.403800010681152,9151.467069625854,9158.870869636536,2671.964959410697
-27183.75,-9.681770324707031,9206.136280059814,9215.818050384521,1000.8603429005436
-27131.08203125,-22.311955451965332,9189.456816673279,9211.768772125244,1820.8841590455881
-26920.24609375,-45.014761447906494,9120.64090681076,9165.655668258667,1623.5091309649556
-27345.73046875,-18.127361297607422,9260.428745269775,9278.556106567383,893.931595110161
-27549.015625,-12.375826835632324,9327.790602684021,9340.166429519653,1369.4463920290618
-27387.951171875,-17.94197177886963,9274.861004829407,9292.802976608276,871.815739225711
-27491.841796875,-24.49762725830078,9309.640585899353,9334.138213157654,997.4993848167437
-27278.03125,-42.322142601013184,9239.81997013092,9282.142112731934,859.9053025875708
-27061.55078125,-59.860814332962036,9168.810201406479,9228.671015739441,854.1310932095859
-27902.873046875,-5.712028503417969,9445.339668273926,9451.051696777344,431.2698923975629
-27095.25390625,-72.88888049125671,9180.687675714493,9253.57655620575,1099.9019988515215
-27813.671875,-19.379313468933105,9416.657670021057,9436.03698348999,998.110905264902
-27906.125,-13.353522300720215,9446.958686828613,9460.312209129333,1454.5804845969778
-28040.349609375,-9.602664947509766,9491.322448730469,9500.925113677979,888.8160315732634
-28199.037109375,-7.012002944946289,9543.91541671753,9550.927419662476,1839.519350904855
-28042.775390625,-28.90143871307373,9493.130647659302,9522.032086372375,981.219960428032
-27936.826171875,-30.261423110961914,9458.35438632965,9488.615809440613,849.5478211153944
-28280.61328125,-3.201875686645508,9571.23871421814,9574.440589904785,902.6401976858045
-27978.251953125,-33.91966152191162,9472.210035324097,9506.129696846008,1244.8612582644914
-28361.111328125,-16.5152645111084,9598.763116836548,9615.278381347656,1024.644835165145
-28204.599609375,-23.498026847839355,9547.052146911621,9570.55017375946,857.925595666514
-28349.35546875,-39.418012619018555,9595.909008979797,9635.327021598816,904.8132286870477
-28129.974609375,-36.63183546066284,9523.2275557518,9559.859391212463,844.9110041873398
-28484.1640625,-18.78252601623535,9639.79863166809,9658.581157684326,867.3425542811648
-28329.90625,-30.74413824081421,9589.314383029938,9620.058521270752,1941.629913215245
-28414.654296875,-36.331932067871094,9617.664155960083,9653.996088027954,931.8141419457088
-28722.5,-19.729275703430176,9719.12941646576,9738.85869216919,1691.6002108992109
-28736.572265625,-16.725337982177734,9723.753050804138,9740.478388786316,833.1868191240153
-28434.890625,-32.54183387756348,9624.486987113953,9657.028820991516,3280.665561632458
-28650.388671875,-25.495593070983887,9695.821042060852,9721.316635131836,848.2645359672856
-28657.740234375,-24.413169860839844,9698.210809707642,9722.623979568481,719.1913069403148
-28834.9921875,-21.567927360534668,9756.912281990051,9778.480209350586,862.1159389552613
-28909.955078125,-17.304200172424316,9781.651043891907,9798.955244064331,798.9718011265089
-28258.03125,-76.86338424682617,9568.0855178833,9644.948902130127,421.5550684755027
-28569.927734375,-83.86681652069092,9671.848170280457,9755.714986801147,1214.6784091058373
-28802.021484375,-23.568446159362793,9746.340923309326,9769.909369468689,687.5927959555033
-28648.853515625,-44.190566062927246,9696.56263923645,9740.753205299377,856.7500383369977
-28899.353515625,-20.754191398620605,9778.416082382202,9799.170273780823,940.7510127443201
-29116.13671875,-16.654071807861328,9850.186171531677,9866.840243339539,821.5724116514522
-29286.4765625,-0.9844274520874023,9906.224640846252,9907.20906829834,592.5500476239383
-28157.580078125,-91.14067268371582,9535.914407253265,9627.055079936981,999.4693751419607
-29396.982421875,7.982956886291504,9942.580457687378,9934.597500801086,1898.116536477305
-29005.25390625,-28.779501914978027,9814.474899291992,9843.25440120697,963.8345796373093
-29162.142578125,-20.26508903503418,9866.02744102478,9886.292530059814,961.4664867092213
-29153.447265625,-25.459221839904785,9863.538847923279,9888.998069763184,864.8638736839487
-29433.154296875,-2.517228126525879,9955.248460769653,9957.76568889618,861.988604903146
-29293.58984375,-14.790383338928223,9909.456408500671,9924.2467918396,1058.6907018793952
-29330.779296875,-16.719456672668457,9922.010231018066,9938.729687690735,620.8306429605534
-29605.447265625,3.3169336318969727,10012.167284965515,10008.850351333618,2445.3521647344996
-29296.69140625,-19.840630531311035,9911.022694587708,9930.863325119019,1642.2667543902726
-29662.8515625,-5.546308517456055,10031.790964126587,10037.337272644043,1183.4292648625394
-29539.5625,-4.762831687927246,9990.843567848206,9995.606399536133,1008.0902479713159
-29640.13671875,-6.995465278625488,10024.405532836914,10031.40099811554,1087.2265415215888
-29654.794921875,-8.038026809692383,10029.297281265259,10037.335308074951,2113.45127591836
-29597.939453125,-18.323981285095215,10011.08803653717,10029.412017822266,1248.6551065739127
-29617.662109375,-11.947700500488281,10017.313598632812,10029.2612991333,865.0915379392841
-29394.1640625,-33.38359260559082,9944.086711883545,9977.470304489136,1168.158692743279
-30060.00390625,17.49608325958252,10162.880787849426,10145.384704589844,1019.0251445687524
-29681.3125,-16.134318351745605,10038.77679347992,10054.911111831665,1572.1895848921429
-29886.69921875,-1.213334083557129,10106.207503318787,10107.420837402344,888.3779813839134
-30180.189453125,14.807422637939453,10202.74006652832,10187.93264389038,1371.7575962472595
-30171.640625,14.806678771972656,10200.10957145691,10185.302892684937,2455.3174434269104
-30039.7578125,7.390705108642578,10156.741926193237,10149.351221084595,1336.4543806276488
-30111.80078125,14.071066856384277,10180.316752433777,10166.245685577393,861.7540325067738
-29978.47265625,-16.601943969726562,10137.579078674316,10154.181022644043,3716.393721550458
-29826.0,-12.064606666564941,10086.852896690369,10098.917503356934,1676.0966333876345
-30383.837890625,14.197771072387695,10270.708543777466,10256.510772705078,1295.3945812972772
-30078.08984375,-12.392915725708008,10170.525001525879,10182.917917251587,1097.8514986266264
-30266.8515625,4.17439079284668,10232.498918533325,10228.324527740479,2095.6522709844767
-30270.708984375,9.952554702758789,10233.45464515686,10223.502090454102,859.1807581073515
-30252.21875,-3.411672592163086,10227.916812896729,10231.328485488892,520.9187321386869
-30567.72265625,15.301559448242188,10331.943079948425,10316.641520500183,859.0473123755977
-30603.083984375,16.822507858276367,10343.516941070557,10326.69443321228,2293.8390067732166
-30483.251953125,5.126164436340332,10304.474720954895,10299.348556518555,919.7755103751902
-30166.767578125,-11.541905403137207,10200.307408332825,10211.849313735962,1101.7205729420675
-30410.98828125,-0.855198860168457,10280.907437324524,10281.762636184692,1105.5982810176654
-30440.64453125,-19.977195739746094,10291.617950439453,10311.5951461792,1845.631011535397
-30590.716796875,11.510334968566895,10339.801943778992,10328.291608810425,1155.348766597853
-30524.947265625,1.9747657775878906,10318.712516784668,10316.73775100708,1213.3408107256225
-30466.462890625,-0.13077735900878906,10299.263120651245,10299.393898010254,890.0126322628162
-30235.423828125,-36.906514167785645,10224.682767868042,10261.589282035828,1202.5703777297701
-30118.173828125,-66.31218719482422,10186.671188354492,10252.983375549316,3485.5589026427133
-30601.615234375,-0.8757638931274414,10344.155836105347,10345.031599998474,1409.2130930184069
-30831.73046875,17.954051971435547,10419.773419380188,10401.819367408752,1238.2136019911911
-30094.6875,-39.01953125,10177.86272239685,10216.88225364685,1563.2814649252934
-30592.673828125,-15.097574234008789,10342.05659866333,10357.154172897339,842.7385221205845
-30431.486328125,-11.305205345153809,10288.58090877533,10299.886114120483,997.5100337792599
-30913.08984375,16.257301330566406,10446.949565887451,10430.692264556885,885.3280676381526
-30615.775390625,-22.61033821105957,10350.370034217834,10372.980372428894,1006.1196892168302
-30159.259765625,-64.03315496444702,10200.802213191986,10264.835368156433,835.4659538689026
-30933.37890625,22.430145263671875,10453.751430511475,10431.321285247803,1825.8997004850626
-30976.955078125,6.600539207458496,10468.764388084412,10462.163848876953,1442.7469395745813
-30672.162109375,-3.281522750854492,10368.121870040894,10371.403392791748,844.5241995122548
-30545.431640625,-58.249295234680176,10328.928619384766,10387.177914619446,1178.153149452287
-30668.609375,-35.12723731994629,10368.55148601532,10403.678723335266,1336.815009340155
-31087.8125,6.181650161743164,10505.613803863525,10499.432153701782,857.333321814305
-30512.68359375,-43.61684811115265,10317.328974604607,10360.94582271576,633.4172805800218
-31000.544921875,10.447936058044434,10476.763494491577,10466.315558433533,871.4292244772844
-30845.921875,-12.167729377746582,10426.506051063538,10438.673780441284,829.7537922654544
-30708.212890625,-31.138079404830933,10381.600775957108,10412.738855361938,6494.56913735173
-30830.890625,-10.214411735534668,10421.390169143677,10431.604580879211,1428.9050954571376
-31183.369140625,6.502471923828125,10537.683288574219,10531.18081665039,998.7142649431615
-31253.216796875,9.741626739501953,10560.707378387451,10550.96575164795,2364.776227192437
-31190.349609375,9.507087707519531,10539.790393829346,10530.283306121826,551.5269656728972
-30545.998046875,-55.8402214050293,10329.034430503845,10384.874651908875,1657.3518168925984
-31203.853515625,8.348543167114258,10544.593524932861,10536.244981765747,1272.4213164429434
-31488.5390625,22.00111198425293,10638.342308044434,10616.34119606018,1237.8930812994201
-31172.166015625,7.201169013977051,10533.984817504883,10526.783648490906,822.7703546332124
-31119.521484375,-9.444477081298828,10517.203797340393,10526.648274421692,4511.807731016613
-30828.748046875,-41.651137351989746,10422.491691589355,10464.142828941345,1537.579821180326
-31396.482421875,2.5801029205322266,10608.785074234009,10606.204971313477,2499.015844200426
-30994.654296875,-39.44447994232178,10477.650339126587,10517.094819068909,1000.1679402828469
-30739.619140625,-56.8097038269043,10393.506963729858,10450.316667556763,673.4822325098884
-31200.017578125,-10.912797927856445,10544.272506713867,10555.185304641724,907.3860596917707
-31277.998046875,-8.694107055664062,10570.182384490967,10578.87649154663,1712.9091921040067
-29089.294921875,-218.46378874778748,9854.054744958878,10072.518533706665,1418.226860151936
-31272.033203125,-9.117144703865051,10568.264018893242,10577.381163597107,922.7322458298684
-31347.4140625,-16.255218505859375,10593.534896850586,10609.790115356445,924.1041489047185
-30926.98828125,-59.7093448638916,10456.297461509705,10516.006806373596,1355.4952142804736
-31410.2890625,-11.436899185180664,10614.113215446472,10625.550114631653,674.0130097984724
-30762.8671875,-74.87956666946411,10402.707872867584,10477.587439537048,2265.1656188681345
-31726.607421875,14.080198287963867,10718.202461242676,10704.122262954712,1262.5517117981033
-31296.34375,-35.61035394668579,10577.688677310944,10613.29903125763,1983.909886170626
-31333.57421875,-15.639280319213867,10589.243579864502,10604.882860183716,816.2663058296454
-31693.166015625,-2.5892763137817383,10707.940084457397,10710.52936077118,846.1445925673171
-31274.271484375,-18.587780952453613,10569.752696990967,10588.34047794342,1148.0985079716504
-31600.12109375,-13.072979927062988,10677.587023735046,10690.66000366211,1335.7035548723838
-31561.25390625,-10.453447341918945,10664.455671310425,10674.909118652344,964.0520299308643
-31390.21875,-24.769298553466797,10608.535906791687,10633.305205345154,1183.919413133999
-32049.044921875,29.552743911743164,10824.634202957153,10795.08145904541,6581.700518535094
-31598.7734375,-20.961423873901367,10677.555641174316,10698.517065048218,1345.4144133670982
-31986.203125,21.630069732666016,10804.267728805542,10782.637659072876,1449.411649786331
-31281.2421875,-51.866812229156494,10573.50206708908,10625.368879318237,1304.8837648889953
-31557.73828125,-32.73534393310547,10664.562419891357,10697.297763824463,1229.8464505072736
-32225.3046875,32.6833553314209,10882.88843345642,10850.205078125,3094.1787851717313
-31958.83984375,9.316634178161621,10795.74224948883,10786.425615310669,2214.3299995974085
-31173.330078125,-54.291945457458496,10538.091311454773,10592.383256912231,1309.4792131863192
-32090.08984375,-0.647089958190918,10839.704899787903,10840.351989746094,2014.2034077047324
-31987.330078125,-5.947264671325684,10806.03949546814,10811.986760139465,1252.2962393778857
-32040.201171875,11.34954833984375,10822.680038452148,10811.330490112305,831.0583577822072
-31757.154296875,-51.56511688232422,10731.573488235474,10783.138605117798,1337.6329578265186
-31835.31640625,-30.63460874557495,10756.879284381866,10787.513893127441,1650.0674820022027
-31751.537109375,-47.42110061645508,10729.872095108032,10777.293195724487,705.68330247236
-31721.1171875,-52.37631702423096,10719.754874229431,10772.131191253662,833.7537312235685
-32010.806640625,-10.000865936279297,10814.189659118652,10824.190525054932,1215.0079544731382
-31910.99609375,-22.551108360290527,10781.729537963867,10804.280646324158,830.7248214874363
-31785.615234375,-36.76638984680176,10740.902369499207,10777.668759346008,1319.5925482644554
-31123.203125,-104.38053321838379,10523.905090332031,10628.285623550415,2021.5806899083098
-32523.259765625,22.34318733215332,10982.58557510376,10960.242387771606,1565.8774725469011
-32499.720703125,24.994853973388672,10974.762691497803,10949.767837524414,1126.5932581552393
-32364.953125,14.055831909179688,10930.600412368774,10916.544580459595,1161.9648877505635
-31326.08203125,-78.8742425441742,10590.482243776321,10669.356486320496,1171.4539624783954
-32138.37890625,-14.534785270690918,10856.958245277405,10871.493030548096,992.4716003269074
-31878.01953125,-75.23758506774902,10773.487552642822,10848.725137710571,893.1662461928421
-31653.4609375,-38.67675304412842,10697.286479949951,10735.96323299408,1214.6776627666482
-31542.259765625,-117.59293174743652,10664.327176094055,10781.920107841492,803.4573036923906
-31662.1484375,-57.66806221008301,10701.097321510315,10758.765383720398,1264.2216326354073
