loss,margin,positive_reward,negative_reward,deterministic_return
0.0,0.0,0.0,0.0,9.01411503317385
-11997.6962890625,852.9799837321043,4184.132170021534,3331.1521862894297,680.8778270117374
-16688.146484375,149.43804550170898,5773.179578781128,5623.741533279419,677.8591631346596
-17860.35546875,121.0230484008789,6161.280475616455,6040.257427215576,799.0305823894005
-18737.837890625,97.8264331817627,6452.740210533142,6354.913777351379,1465.526941458526
-19372.083984375,88.33918380737305,6664.084265708923,6575.74508190155,2361.964442087564
-19842.326171875,92.41727256774902,6819.320410728455,6726.903138160706,1298.088175696125
-20343.75,81.05296993255615,6986.105819702148,6905.052849769592,3141.4570036925797
-21018.734375,84.2094144821167,7208.616321563721,7124.406907081604,1510.1230360505267
-21248.056640625,88.34310913085938,7284.529809951782,7196.186700820923,799.5239734264223
-21266.451171875,64.33624458312988,7294.396743774414,7230.060499191284,447.98136249151463
-21947.859375,87.4738712310791,7517.109110832214,7429.635239601135,2402.258470602604
-22286.88671875,83.19209289550781,7630.267595291138,7547.07550239563,937.0892326091621
-22522.52734375,83.61148929595947,7708.541996002197,7624.930506706238,1056.4366467971176
-22801.435546875,80.3524808883667,7801.684673309326,7721.3321924209595,2236.9500199168697
-22860.513671875,64.58402872085571,7823.478391170502,7758.894362449646,1163.194004489007
-22884.998046875,53.065003395080566,7833.352576255798,7780.287572860718,6167.665875934248
-23363.033203125,69.18459510803223,7989.442131996155,7920.257536888123,1224.532843890835
-23327.607421875,49.58146619796753,7980.286793231964,7930.705327033997,463.6988785560885
-23616.96875,69.04936599731445,8073.889879226685,8004.84051322937,485.7990788500559
-23875.7578125,66.86273574829102,8159.974925994873,8093.112190246582,2435.992784755182
-24024.833984375,61.2277889251709,8210.350244522095,8149.122455596924,1514.829005060584
-24184.931640625,71.51877212524414,8262.557938575745,8191.0391664505005,999.6358355032991
-24162.7890625,53.187076568603516,8257.189324378967,8204.002247810364,945.2621188466669
-24192.79296875,52.951022148132324,8267.469093322754,8214.518071174622,759.1333237558988
-24563.529296875,71.56840991973877,8388.076183319092,8316.507773399353,805.901957470129
-24680.810546875,71.90936756134033,8427.38101863861,8355.47165107727,607.8680954409665
-24213.0625,16.902660369873047,8279.14566707611,8262.243006706238,1298.2699140762052
-24790.2890625,54.85383224487305,8465.966669082642,8411.112836837769,1137.2790611882403
-24623.88671875,37.5250129699707,8412.878351211548,8375.353338241577,644.940918980966
-25105.37109375,57.55278301239014,8569.701738357544,8512.148955345154,956.8132640837342
-25258.728515625,64.05788898468018,8619.747436523438,8555.689547538757,2377.446068880248
-25203.501953125,52.46460151672363,8603.148593902588,8550.683992385864,1330.935449955219
-25371.87109375,64.62921333312988,8657.745133399963,8593.115920066833,3087.8655780587537
-25450.849609375,53.93661308288574,8685.155165672302,8631.218552589417,435.4224685350843
-25508.755859375,55.64912033081055,8704.837817192078,8649.188696861267,1612.51963179016
-25634.625,64.13466739654541,8745.34963130951,8681.214963912964,614.0616865952809
-25800.318359375,53.97875118255615,8800.838642120361,8746.859890937805,1832.5500700092405
-25697.208984375,50.45810031890869,8767.954305648804,8717.496205329895,1327.8576475573743
-25758.134765625,46.17251014709473,8788.434992790222,8742.262482643127,2268.9341977172166
-25989.734375,53.74165725708008,8864.230498313904,8810.488841056824,741.4913614472748
-26021.90234375,37.83370304107666,8876.294096946716,8838.46039390564,867.0263938933251
-26024.298828125,41.14664840698242,8877.283719062805,8836.137070655823,803.538111000816
-26289.625,53.07698345184326,8963.6965341568,8910.619550704956,761.488673229539
-25609.3828125,-1.9524269104003906,8745.103203296661,8747.055630207062,1352.7259711457714
-26413.935546875,44.704912185668945,9005.7476272583,8961.042715072632,1796.1026364348447
-26365.220703125,56.15815734863281,8989.444319725037,8933.286162376404,425.68790733196573
-26098.8828125,8.778548955917358,8905.729065656662,8896.950516700745,998.3742723239582
-26359.28515625,35.5607328414917,8990.167922019958,8954.607189178467,1791.952147897343
-26167.248046875,2.092721939086914,8929.601099014282,8927.508377075195,780.288890922225
-26859.23046875,56.07120990753174,9152.583735466003,9096.512525558472,958.292622813631
-26618.103515625,22.339953422546387,9076.740940093994,9054.400986671448,2417.5716534007747
-26682.677734375,25.385876655578613,9097.903415679932,9072.517539024353,918.4131609016296
-26836.30859375,30.402664184570312,9148.501388549805,9118.098724365234,3385.164651845454
-26921.97265625,35.0601749420166,9176.39433002472,9141.334155082703,1726.79606519153
-27088.294921875,45.33115291595459,9230.22274684906,9184.891593933105,884.4746648383568
-26598.970703125,10.442298889160156,9072.771814346313,9062.329515457153,1231.6912229240297
-27187.4765625,32.73748588562012,9264.436058998108,9231.698573112488,2674.3656891398964
-27052.8046875,8.036879062652588,9222.351951122284,9214.315072059631,1230.1025536750471
-26407.1015625,-4.464114189147949,9011.468688964844,9015.932803153992,602.7700183039614
-27296.173828125,25.040968894958496,9301.440532684326,9276.399563789368,748.2821031111324
-27424.19921875,35.46286487579346,9342.992858886719,9307.529994010925,3984.155988417536
-27237.072265625,11.93520736694336,9283.95475101471,9272.019543647766,928.2940334823722
-27675.162109375,44.595590591430664,9424.967468261719,9380.371877670288,374.5438916278181
-26976.55078125,-16.825137615203857,9201.341971874237,9218.167109489441,1369.1602567107427
-27274.509765625,-14.790919303894043,9298.90145111084,9313.692370414734,1123.9557290121868
-27594.74609375,17.33217430114746,9401.611535072327,9384.27936077118,815.5744145539511
-27457.517578125,11.837479591369629,9356.932850837708,9345.095371246338,1020.5820761739948
-27789.869140625,23.51883316040039,9465.552613258362,9442.033780097961,906.3627797795801
-27878.908203125,19.74335765838623,9495.88311958313,9476.139761924744,1553.002010868461
-26936.25390625,-58.78286558389664,9192.735407292843,9251.51827287674,1358.6959231458245
-27669.05859375,2.0077028274536133,9428.704275131226,9426.696572303772,374.13417120335043
-28183.1484375,23.785059928894043,9595.630686759949,9571.845626831055,901.1390544518819
-27683.673828125,-21.665173053741455,9436.209352016449,9457.87452507019,2911.0297866838155
-28072.84765625,9.49476146697998,9561.356612205505,9551.861850738525,1043.7005780736986
-27452.044921875,-71.37403357028961,9364.740421652794,9436.114455223083,1903.7652443624102
-27657.107421875,-26.477441787719727,9427.821182250977,9454.298624038696,1050.1341233953037
-27817.212890625,-15.845685958862305,9480.036573410034,9495.882259368896,1585.5843594997903
-28125.2265625,-1.095189094543457,9580.224551200867,9581.31974029541,866.1573510060723
-28353.173828125,1.1003103256225586,9655.518912315369,9654.418601989746,646.2463529874781
-28554.169921875,26.398125648498535,9718.704266548157,9692.306140899658,1594.8716336695031
-28386.4375,-6.973230361938477,9667.10684299469,9674.080073356628,372.1787565158014
-28046.775390625,-29.097119629383087,9557.987798392773,9587.084918022156,971.182380663007
-28139.826171875,-29.183547735214233,9588.63169836998,9617.815246105194,369.81378939773356
-28439.890625,9.612360000610352,9683.33094215393,9673.71858215332,375.88830091201305
-28486.310546875,-4.5952606201171875,9700.395977020264,9704.99123764038,742.8389085923008
-28948.373046875,14.325858116149902,9851.493304252625,9837.167446136475,567.9980450087874
-28429.630859375,-22.27744770050049,9684.033172607422,9706.310620307922,841.1726082688882
-28417.876953125,-30.50321388244629,9680.864002227783,9711.36721611023,1553.8964231189389
-28601.353515625,-7.679114818572998,9739.448589801788,9747.127704620361,804.2616505213359
-28470.88671875,-11.392637252807617,9697.112998008728,9708.505635261536,1052.7524945927616
-28596.34765625,-21.20909595489502,9739.205721855164,9760.414817810059,1504.8085981923969
-29067.310546875,13.801071166992188,9891.255224227905,9877.454153060913,2263.4962209650744
-27538.2421875,-98.66130495071411,9398.31980085373,9496.981105804443,908.914792370479
-29036.98828125,2.850600242614746,9882.551445960999,9879.700845718384,1029.8775504650062
-29202.66015625,12.750965118408203,9936.304735183716,9923.553770065308,514.8903443640556
-29136.486328125,-1.6474685668945312,9915.49806022644,9917.145528793335,838.337917961346
-29147.955078125,9.44048023223877,9918.516353607178,9909.075873374939,398.92318513775575
-29088.5,-0.2160940170288086,9900.244861602783,9900.460955619812,844.3058484539052
-29154.189453125,-4.156863212585449,9922.397033691406,9926.553896903992,3008.8666681714826
-29114.984375,-5.376982688903809,9909.418150901794,9914.795133590698,1071.4882611242533
-29225.115234375,6.994731903076172,9944.68807888031,9937.693346977234,1028.4951909731158
-29433.294921875,15.900323867797852,10013.020153045654,9997.119829177856,1061.8342504263394
-29339.974609375,-6.086660385131836,9984.2026014328,9990.289261817932,362.0171026009011
-28936.412109375,-41.36186695098877,9854.881847381592,9896.24371433258,1307.3476321391959
-28069.578125,-115.67397832870483,9576.585867404938,9692.259845733643,848.6616489829761
-29684.291015625,12.995431900024414,10096.310218811035,10083.31478691101,1182.3824812629205
-29290.966796875,-15.238109588623047,9969.364786148071,9984.602895736694,903.5946561740093
-29131.36328125,-51.68459415435791,9920.612798690796,9972.297392845154,851.8636701688648
-29458.99609375,6.929084777832031,10023.156554222107,10016.227469444275,1996.0502952712277
-29603.345703125,-6.847092628479004,10071.873503684998,10078.720596313477,2165.3092644102517
-29608.255859375,-13.855868339538574,10074.644145011902,10088.50001335144,963.6005170953024
-29474.67578125,-20.31843876838684,10031.243992567062,10051.56243133545,387.7676254845627
-28988.361328125,-48.606672286987305,9873.25006389618,9921.856736183167,858.7031115012002
-29917.71484375,16.43564796447754,10173.645893096924,10157.210245132446,1584.8272307115922
-30086.9921875,15.420284271240234,10229.433776855469,10214.013492584229,1857.8422324421358
-29389.9453125,-40.40403079986572,10005.354957580566,10045.758988380432,966.8049244058127
-29350.884765625,-54.97854709625244,9993.97396659851,10048.952513694763,891.2854702272241
-29495.15234375,-29.34712505340576,10039.566641807556,10068.913766860962,1931.7943431011051
-29590.24609375,-21.199252128601074,10069.988061904907,10091.187314033508,562.1692695639006
-30018.0078125,-0.02349090576171875,10208.827250480652,10208.850741386414,1741.1793326172192
-28652.822265625,-102.89616894721985,9768.073320388794,9870.969489336014,544.7602012606491
-29503.703125,-69.10645771026611,10045.90556716919,10115.012024879456,973.7197596269722
-30018.83984375,1.3195610046386719,10208.98192691803,10207.662365913391,523.9524471680602
-30003.4921875,-8.363675117492676,10205.490258216858,10213.85393333435,836.2280542602881
-29039.27734375,-142.81830739974976,9900.78092288971,10043.59923028946,2585.762502286706
-30147.283203125,-13.368107795715332,10253.273701667786,10266.641809463501,1000.2883531095358
-29831.7265625,-28.070833683013916,10150.74423456192,10178.815068244934,1408.5831568551
-30344.953125,4.222196578979492,10316.58533859253,10312.36314201355,982.4890979562472
-29922.626953125,-17.000202178955078,10179.612112045288,10196.612314224243,372.5478904464885
-29317.767578125,-102.87482690811157,9988.997520923615,10091.872347831726,377.14870034851936
-29767.875,-46.79383659362793,10131.76810836792,10178.561944961548,378.40463108083054
-30026.45703125,-18.088857650756836,10214.826636314392,10232.915493965149,1029.201431305477
-30380.5703125,4.461706161499023,10329.104661941528,10324.64295578003,1088.68535676191
-29980.41796875,-37.45751619338989,10201.016923427582,10238.474439620972,834.6183900791523
-30429.80859375,-8.749231338500977,10347.542908668518,10356.292140007019,1030.485381868024
-29920.916015625,-37.78017520904541,10180.976121902466,10218.756297111511,1037.881766030425
-30163.2421875,-25.39371395111084,10260.557558059692,10285.951272010803,797.2709738577131
-29867.7109375,-101.83203315734863,10171.095314979553,10272.927348136902,412.8647273223809
-29228.74609375,-126.21365928649902,9961.63512802124,10087.84878730774,2577.608974883013
-29987.1328125,-64.89433908462524,10206.281621456146,10271.175960540771,1043.7874702238098
-30145.107421875,-60.24418497085571,10259.404082775116,10319.648267745972,1378.4074207835822
-29930.521484375,-52.37277317047119,10186.400740623474,10238.773513793945,1259.1620486199415
-30802.08203125,12.925058364868164,10467.741775512695,10454.816717147827,1339.639463329803
-29704.56640625,-74.09457033872604,10114.654133617878,10188.748703956604,979.9649738112239
-30432.478515625,-31.13486385345459,10350.485383987427,10381.620247840881,1123.7865398845138
-30872.572265625,13.070082664489746,10491.363247871399,10478.29316520691,1041.7828520233204
-30552.88671875,-15.639952659606934,10388.820211410522,10404.46016407013,357.5528918351781
-30198.548828125,-72.69724750518799,10277.888583183289,10350.585830688477,1664.1339595266927
-30231.185546875,-58.050371170043945,10287.267166137695,10345.31753730774,580.3999941377505
-30570.849609375,-31.93666362762451,10396.583882331848,10428.520545959473,1803.1788735352616
-30218.7265625,-81.30515968799591,10285.41570341587,10366.720863103867,911.7569261982245
-29948.30859375,-72.21884822845459,10194.9129114151,10267.131759643555,1964.286688905886
-29868.1640625,-120.98399543762207,10173.903006076813,10294.887001514435,908.1995241065007
-30833.599609375,-2.770404815673828,10480.422080039978,10483.192484855652,419.9149376062118
-30661.484375,-22.330121994018555,10426.091032028198,10448.421154022217,729.8608441179448
-30699.513671875,-27.414189338684082,10438.887952804565,10466.30214214325,1017.6397466310154
-30932.90234375,-1.9516544342041016,10513.314050674438,10515.265705108643,1673.6731424468076
-29771.0546875,-131.8536958694458,10143.820324897766,10275.674020767212,1298.9325210124198
-29922.474609375,-114.35656523704529,10191.335213899612,10305.691779136658,386.646631596572
-31198.146484375,3.5650758743286133,10600.672533988953,10597.107458114624,1246.9834827164807
-30730.49609375,-37.842867851257324,10450.474576950073,10488.31744480133,956.1618641143832
-30314.564453125,-62.01649856567383,10315.733095169067,10377.749593734741,1132.3278352428551
-30830.7578125,-34.11969470977783,10483.335141181946,10517.454835891724,1058.511156140522
-30885.544921875,-20.285330772399902,10500.062601089478,10520.347931861877,1603.0566329240119
-30478.95703125,-70.22339981794357,10370.925139725208,10441.148539543152,900.3748524629096
-30523.310546875,-105.44698476791382,10388.836641788483,10494.283626556396,1220.6951378878211
-31024.853515625,-48.65081214904785,10549.166849136353,10597.8176612854,1120.996726315012
-30394.5078125,-81.60861873626709,10344.702582359314,10426.311201095581,896.992865052204
-31048.962890625,-13.940500259399414,10553.599000930786,10567.539501190186,3055.9708743548645
-29854.423828125,-194.11853766441345,10177.935511827469,10372.054049491882,372.04682252041556
-31094.61328125,-18.2863130569458,10569.558512687683,10587.844825744629,897.3337275186884
-30070.138671875,-160.97341012954712,10245.202261447906,10406.175671577454,1014.3544426136644
-29953.53125,-128.1266086101532,10202.964475870132,10331.091084480286,503.59098096731776
-30966.142578125,-40.60532760620117,10529.11286354065,10569.71819114685,372.66796230070935
-31446.779296875,-6.372676849365234,10684.535972595215,10690.90864944458,1214.4084876300158
-30203.658203125,-140.40939116477966,10288.358607053757,10428.767998218536,1356.8656514020377
-30462.32421875,-40.884084701538086,10361.984397888184,10402.868482589722,368.2847185388555
-31324.103515625,-26.079514503479004,10645.833411216736,10671.912925720215,847.9563637855907
-30273.22265625,-143.75195050239563,10311.10548567772,10454.857436180115,373.7913389458295
-31569.94140625,-13.035480499267578,10726.027341842651,10739.062822341919,355.5836943430872
-30884.013671875,-34.490750312805176,10501.994245529175,10536.48499584198,4176.276133976514
-31060.2890625,-67.57308387756348,10563.39697265625,10630.970056533813,1828.2611495810713
-31078.01171875,-93.8839066028595,10573.008940458298,10666.892847061157,1008.2355737196431
-29629.716796875,-228.18692922592163,10106.184466838837,10334.371396064758,1085.0177140032354
-31663.431640625,2.770711898803711,10756.048105239868,10753.277393341064,517.714581964951
-30576.48828125,-84.43094253540039,10405.630162239075,10490.061104774475,871.9791697851718
-31556.44921875,-13.768885612487793,10722.051642417908,10735.820528030396,1338.4757281159898
-29263.33984375,-218.17213022708893,9985.10935986042,10203.28149008751,656.8679799490568
-30442.46875,-159.3985242843628,10369.622188568115,10529.020712852478,1623.892682115579
-30278.1171875,-143.10677802562714,10313.553473114967,10456.660251140594,730.2742580376674
-30740.287109375,-140.98639297485352,10465.17210483551,10606.158497810364,947.7644863280744
-30671.431640625,-89.51119613647461,10436.920426368713,10526.431622505188,955.874070840331
-31933.041015625,10.686481475830078,10843.929964065552,10833.243482589722,837.6261553165803
-30681.1171875,-108.67649745941162,10442.88014793396,10551.556645393372,909.6135296298085
-31432.37109375,-42.93804740905762,10684.293964385986,10727.232011795044,2190.551524957103
-31797.873046875,-20.937198638916016,10802.347036361694,10823.28423500061,880.4659275621204
-31085.689453125,-78.69407606124878,10573.76664686203,10652.460722923279,882.904158106539
-29536.287109375,-275.04863595962524,10081.814577579498,10356.863213539124,1162.3064047784726
-29074.275390625,-323.40849351882935,9934.716580867767,10258.125074386597,574.8829706364106
-31655.15625,-21.025168418884277,10755.96877002716,10776.993938446045,1014.827934943266
