loss,margin,positive_reward,negative_reward,deterministic_return
0.0,0.0,0.0,0.0,8.40902279931575
-3150.331787109375,791.5011463239789,4356.5974421054125,3565.0962957814336,718.5351447409206
-4364.498046875,85.08328819274902,5909.615986824036,5824.532698631287,1017.6592399306451
-4701.52490234375,42.894710540771484,6332.618059158325,6289.723348617554,751.4264607177454
-4924.576171875,20.447505950927734,6612.0940618515015,6591.646555900574,4536.428126756386
-5112.8359375,-11.658029556274414,6849.125611305237,6860.783640861511,2763.4430538276733
-5275.63916015625,-29.729248046875,7053.31814289093,7083.047390937805,3983.4875803766636
-5411.97412109375,-39.124738693237305,7224.233016014099,7263.357754707336,2677.9451102377166
-5478.30712890625,-52.12898349761963,7308.040374755859,7360.169358253479,864.875410617004
-5586.22705078125,-60.56668472290039,7443.252528190613,7503.819212913513,1944.7346810777854
-5702.47802734375,-59.03759956359863,7588.074837684631,7647.11243724823,2123.26520827438
-5751.54150390625,-60.08993721008301,7649.550851821899,7709.640789031982,1669.2125933729444
-5845.0146484375,-74.27678775787354,7767.114971160889,7841.391758918762,2185.7320078705807
-5903.0341796875,-68.63247871398926,7839.177930831909,7907.810409545898,1428.600053980045
-5938.962890625,-73.49201965332031,7884.386870384216,7957.878890037537,3069.0189011220828
-6004.08544921875,-83.1326675415039,7966.244409561157,8049.377077102661,1582.5758675579718
-6005.6337890625,-88.01752662658691,7968.984209060669,8057.001735687256,2129.5590740504576
-6096.77294921875,-82.75026607513428,8082.129668235779,8164.879934310913,1248.0845633637437
-6138.2333984375,-89.00079727172852,8134.359894752502,8223.360692024231,1405.795490796995
-6181.6298828125,-93.4766616821289,8188.724862098694,8282.201523780823,797.4551094907594
-6230.408203125,-94.8531379699707,8249.582286834717,8344.435424804688,2678.961227571171
-6233.90576171875,-99.00592136383057,8254.393741607666,8353.399662971497,1869.4038368962886
-6288.42138671875,-93.27470207214355,8321.994174957275,8415.268877029419,2408.925070793233
-6197.5322265625,-118.20850443840027,8210.997295618057,8329.205800056458,3554.366466750647
-6313.26611328125,-98.63179111480713,8353.548733711243,8452.18052482605,2519.2700295576274
-6370.88037109375,-93.77577781677246,8425.128203392029,8518.903981208801,788.1988224739744
-6410.46630859375,-97.62082862854004,8474.713688850403,8572.334517478943,1998.7622364631845
-6421.98876953125,-95.88187885284424,8488.985620498657,8584.867499351501,1749.599395466052
-6402.00927734375,-107.37128829956055,8465.09866142273,8572.46994972229,1100.067644867878
-6496.150390625,-101.03439235687256,8581.76027393341,8682.794666290283,652.6056482682463
-6484.8701171875,-103.14763069152832,8567.963150978088,8671.110781669617,1870.0522315674089
-6530.35546875,-96.56578254699707,8624.21663570404,8720.782418251038,1983.6232656936302
-6428.90576171875,-122.1787600517273,8500.005156040192,8622.183916091919,2183.0340774665424
-6548.40234375,-121.06606483459473,8648.610876083374,8769.676940917969,1519.4609633893187
-6562.5791015625,-103.29383182525635,8665.159742355347,8768.453574180603,1262.3066397125237
-6553.12158203125,-118.27897644042969,8654.499733924866,8772.778710365295,3004.2793759668803
-6644.64794921875,-101.45718002319336,8767.417722702026,8868.87490272522,2013.8783201671158
-6625.66552734375,-118.88922214508057,8745.05465221405,8863.94387435913,1931.251364128551
-6579.2626953125,-133.43694877624512,8688.403950691223,8821.840899467468,1095.315430615073
-6591.84814453125,-157.15023612976074,8706.363883972168,8863.514120101929,1268.2321062034243
-6530.00830078125,-133.46740913391113,8626.588618278503,8760.056027412415,1652.0744624599874
-6691.33642578125,-116.81768226623535,8826.9241771698,8943.741859436035,1546.3841074291338
-6761.740234375,-103.58932781219482,8913.734492301941,9017.323820114136,1469.1464885534608
-6776.45703125,-105.75446128845215,8932.259464263916,9038.013925552368,2060.924971413007
-6773.78466796875,-120.18647384643555,8929.866743087769,9050.053216934204,649.6711804874093
-6769.396484375,-115.54691219329834,8924.333688735962,9039.88060092926,2385.0751094624734
-6814.75732421875,-110.50819301605225,8980.651633262634,9091.159826278687,1405.3095712589238
-6831.9765625,-118.61124897003174,9002.52528476715,9121.136533737183,978.2276673676005
-6871.5234375,-105.20337295532227,9050.924771308899,9156.128144264221,2369.817693789374
-6840.75390625,-118.73810482025146,9013.753603935242,9132.491708755493,1414.3870323308256
-6919.943359375,-108.59104347229004,9111.609313964844,9220.200357437134,2370.78551024178
-6889.7958984375,-115.67232894897461,9074.700077056885,9190.37240600586,1572.3786192347013
-6808.28076171875,-155.90278911590576,8975.893407821655,9131.796196937561,2044.7599661224738
-6858.54833984375,-134.54900979995728,9037.274587154388,9171.823596954346,1583.4067728185505
-6926.5068359375,-124.26945209503174,9121.077680587769,9245.3471326828,2160.469228830453
-6977.7158203125,-117.06168460845947,9184.279977798462,9301.341662406921,1617.0230245493053
-6912.689453125,-129.25295162200928,9104.377243995667,9233.630195617676,668.0705181176403
-6992.84716796875,-121.49270629882812,9203.51640701294,9325.009113311768,1057.8802964655802
-6924.4052734375,-138.10898399353027,9119.610877990723,9257.719861984253,1129.1542275613642
-6989.9072265625,-123.76248073577881,9200.188063621521,9323.9505443573,1095.8733356207294
-7076.27490234375,-114.73722457885742,9307.122575759888,9421.859800338745,1175.7645041583278
-6911.70166015625,-162.7683744430542,9106.078874588013,9268.847249031067,1126.9409109777578
-7001.66162109375,-125.93083381652832,9215.14708328247,9341.077917098999,2682.999760314064
-7125.56201171875,-114.6194953918457,9368.808420181274,9483.42791557312,1702.1743391842947
-6985.296875,-142.4332447052002,9196.280746459961,9338.713991165161,1724.5466703233847
-7132.40380859375,-117.43105602264404,9377.530913352966,9494.96196937561,1404.7867241131191
-7140.09912109375,-123.30716705322266,9387.33688545227,9510.644052505493,2826.8671725389354
-7150.7158203125,-122.07369899749756,9400.69612789154,9522.769826889038,1702.019442168242
-7082.00732421875,-128.3787670135498,9315.694912910461,9444.073679924011,1826.49685926429
-7147.27880859375,-119.86452960968018,9396.540858268738,9516.405387878418,2159.6423942419424
-7175.9296875,-119.06468963623047,9432.26484489441,9551.32953453064,1361.94979065173
-7065.49951171875,-157.8055590391159,9297.360121846199,9455.165680885315,2580.067050903551
-7161.72265625,-138.1609649658203,9415.708805084229,9553.869770050049,1942.651391203367
-7121.43115234375,-139.2840394973755,9365.939633369446,9505.223672866821,1160.3729660224074
-7075.97412109375,-160.86611080169678,9311.066221237183,9471.93233203888,749.5225221505527
-7277.41357421875,-114.3470230102539,9558.356496810913,9672.703519821167,2621.2205591612333
-7211.2919921875,-130.4972620010376,9477.169622421265,9607.666884422302,1011.2029496624265
-7240.35791015625,-132.00790214538574,9513.473950386047,9645.481852531433,1402.7675676019799
-7296.14013671875,-116.2021598815918,9581.896802902222,9698.098962783813,2131.9035080682347
-7265.45556640625,-119.49461269378662,9544.038041114807,9663.532653808594,2399.688397859394
-7190.50927734375,-139.67443656921387,9452.08869934082,9591.763135910034,1044.835634317802
-7212.4580078125,-151.35383224487305,9480.460919380188,9631.814751625061,1738.811793972218
-7107.3408203125,-203.1336531639099,9353.066259860992,9556.199913024902,2293.0237188995347
-7259.53125,-134.58436393737793,9538.024580001831,9672.608943939209,2703.95173223589
-7331.658203125,-123.01084232330322,9626.942700386047,9749.95354270935,1457.2444381284506
-7378.56201171875,-117.90483665466309,9684.97713470459,9802.881971359253,2495.3543592750884
-7314.56298828125,-138.6832914352417,9606.943797111511,9745.627088546753,992.0700224142864
-7385.2568359375,-114.4610824584961,9693.085033416748,9807.546115875244,881.8692407335724
-7380.04736328125,-119.36635971069336,9687.14674949646,9806.513109207153,1861.026339066965
-7358.32666015625,-133.29471111297607,9661.228611946106,9794.523323059082,1256.3534672651988
-7144.55712890625,-208.52130895853043,9400.513831555843,9609.035140514374,2529.557106797171
-7331.90478515625,-124.80766582489014,9627.507313728333,9752.314979553223,2813.8655796699245
-7435.755859375,-112.83057308197021,9756.309348106384,9869.139921188354,1577.5376645921624
-7425.66748046875,-131.38326263427734,9744.852602005005,9876.235864639282,2449.953794133279
-7261.5673828125,-178.82307279109955,9544.344042420387,9723.167115211487,2077.4087199302962
-7482.03271484375,-108.45200538635254,9813.698392868042,9922.150398254395,1609.2220204821529
-7479.53662109375,-119.52141189575195,9811.424019813538,9930.94543170929,1731.402622432753
-7481.71044921875,-125.70971298217773,9814.680294036865,9940.390007019043,1084.4859284069182
-7476.6201171875,-119.83832263946533,9807.828490257263,9927.666812896729,1261.9204221727084
-7531.72900390625,-131.21117115020752,9877.258482933044,10008.469654083252,2070.104042555559
-7534.556640625,-112.06357192993164,9879.469730377197,9991.533302307129,1117.4609058787926
-7477.86962890625,-128.58599853515625,9810.123396873474,9938.70939540863,5256.84111350623
-7440.94775390625,-163.62374877929688,9766.679983139038,9930.303731918335,2234.833872308327
-7530.9833984375,-129.63431358337402,9876.425979614258,10006.060293197632,607.241318148446
-7533.7177734375,-127.53720188140869,9879.820950508118,10007.358152389526,2705.1966153858107
-7375.81787109375,-177.74622297286987,9686.675584316254,9864.421807289124,1918.4728466031402
-7600.72412109375,-111.01111221313477,9962.050910949707,10073.062023162842,1401.4830924267583
-7549.6572265625,-126.37248992919922,9899.53451538086,10025.907005310059,1888.5687783743329
-7567.126953125,-131.61338996887207,9921.904227256775,10053.517617225647,2420.282127295222
-7581.36767578125,-129.58066082000732,9939.383105278015,10068.963766098022,1794.1591927135498
-7433.501953125,-170.5705051422119,9758.476511001587,9929.047016143799,1220.126891404155
-7605.4814453125,-134.0554599761963,9969.563293457031,10103.618753433228,1060.1123923913685
-7535.4140625,-142.28551244735718,9883.227014064789,10025.512526512146,1913.1482187002327
-7634.49853515625,-128.61235904693604,10005.766995429993,10134.379354476929,2285.8776622385853
-7601.80126953125,-133.37736892700195,9965.301089286804,10098.678458213806,908.3191247495114
-7447.40185546875,-180.51112949848175,9776.185819029808,9956.69694852829,2548.9185520440283
-7702.05712890625,-123.55898094177246,10089.598602294922,10213.157583236694,1088.6748009242908
-7703.2109375,-116.59729290008545,10090.433848381042,10207.031141281128,2625.056286626518
-7694.68017578125,-124.96166229248047,10080.444686889648,10205.406349182129,1785.0965194989315
-7624.6328125,-133.17971229553223,9993.74254322052,10126.922255516052,1223.316938877342
-7581.9169921875,-164.7786054611206,9942.793703079224,10107.572308540344,1143.0529375542026
-7658.16845703125,-152.41061305999756,10037.057294845581,10189.467907905579,1317.8480469490198
-7575.1298828125,-151.0544159412384,9933.716040372849,10084.770456314087,1774.0129064608077
-7735.8798828125,-120.83707809448242,10131.674055099487,10252.51113319397,1160.1546908728596
-7626.3974609375,-154.72810649871826,9997.65293598175,10152.381042480469,929.5225419885758
-7631.1162109375,-160.9600796699524,10003.815968036652,10164.776047706604,3679.3274915662273
-7745.39599609375,-125.44855308532715,10143.949216842651,10269.397769927979,2249.5295644570433
-7558.16162109375,-193.05024194717407,9915.562333583832,10108.612575531006,2787.7375098020766
-7744.150390625,-138.02135848999023,10143.40825843811,10281.4296169281,3377.5838553970184
-7693.00048828125,-161.16987133026123,10081.40334033966,10242.573211669922,2267.951726181296
-7725.93017578125,-139.52428150177002,10120.854451179504,10260.378732681274,2646.5823353819846
-7713.1083984375,-139.60859203338623,10104.717679023743,10244.326271057129,1032.2603327311929
-7799.7900390625,-129.1065797805786,10212.11077594757,10341.21735572815,2059.0190871813365
-7693.677734375,-160.2147159576416,10082.107711791992,10242.322427749634,1985.2645161496048
-7781.67041015625,-140.5109806060791,10190.378269195557,10330.889249801636,1579.4051388570479
-7707.32763671875,-134.9731011390686,10097.513540744781,10232.48664188385,2932.115248223253
-7821.8740234375,-139.75504684448242,10240.279899597168,10380.03494644165,1500.8567113961076
-7746.01708984375,-164.7869987487793,10147.903096199036,10312.690094947815,1493.9270771734596
-7786.611328125,-132.06266498565674,10196.067008018494,10328.12967300415,1397.2140738321425
-7798.5498046875,-147.55534648895264,10212.001009941101,10359.556356430054,1132.8713559737491
-7778.865234375,-153.22566890716553,10187.76127243042,10340.986941337585,2459.233571379088
-7770.9970703125,-153.468976020813,10178.31687259674,10331.785848617554,1574.7194031120148
-7901.4462890625,-125.32607650756836,10338.645080566406,10463.971157073975,1186.1773624645825
-7787.8564453125,-153.18808460235596,10199.180706977844,10352.3687915802,2110.945957493238
-7842.52880859375,-143.01509857177734,10266.63452911377,10409.649627685547,1582.8247615115513
-7883.03955078125,-134.84794998168945,10316.454708099365,10451.302658081055,3579.8142386484396
-7923.0517578125,-132.02830505371094,10366.0837059021,10498.11201095581,2390.4125310186655
-7917.61376953125,-128.36543655395508,10359.152347564697,10487.517784118652,2869.4130828010543
-7619.5751953125,-224.6457543373108,9994.819416046143,10219.465170383453,3092.2537274435135
-7862.88427734375,-150.8916997909546,10292.548954963684,10443.440654754639,2637.6758118080625
-7941.81494140625,-131.59956169128418,10389.741201400757,10521.340763092041,637.0092490100618
-7884.41259765625,-151.38242626190186,10319.569073677063,10470.951499938965,2557.5202477754815
-7948.63671875,-138.22872161865234,10398.463766098022,10536.692487716675,2164.7513418079816
-7814.2900390625,-176.7574758529663,10233.907506942749,10410.664982795715,1098.0305719234248
-7855.2822265625,-180.42637634277344,10285.303123474121,10465.729499816895,1026.4031128061445
-7913.755859375,-184.37992334365845,10358.65539598465,10543.035319328308,2456.6990640094614
-7704.470703125,-195.45672130584717,10097.767437934875,10293.224159240723,1488.578772089125
-7838.55126953125,-184.34732055664062,10264.811570167542,10449.158890724182,2781.5976640075423
-7979.40185546875,-130.924298286438,10436.570233345032,10567.49453163147,1006.793070102902
-7751.8515625,-241.02598810195923,10160.829093456268,10401.855081558228,2060.0951353472524
-7975.82421875,-139.61434078216553,10432.87729549408,10572.491636276245,5140.4966683403945
-7921.611328125,-155.81990814208984,10366.361866950989,10522.181775093079,608.1663805860918
-7989.134765625,-147.77330207824707,10449.880352020264,10597.65365409851,5207.630778538787
-7871.3583984375,-198.57594394683838,10306.968665122986,10505.544609069824,1390.5551266910809
-7842.21630859375,-177.41381168365479,10268.935826301575,10446.34963798523,1927.0366557343784
-7955.95361328125,-154.1926498413086,10409.104053497314,10563.296703338623,408.03941693254046
-7793.27734375,-208.5760269165039,10210.35388469696,10418.929911613464,937.7272449502067
-7742.81396484375,-225.20615935325623,10148.420689821243,10373.6268491745,1010.097791827934
-8064.01708984375,-129.20252799987793,10541.982332229614,10671.184860229492,1225.2570141428012
-8055.56494140625,-127.56337261199951,10531.410046577454,10658.973419189453,1088.515647893366
-7882.1201171875,-212.62796592712402,10321.004893302917,10533.632859230042,3959.323053121129
-7878.4189453125,-185.89093589782715,10315.002290725708,10500.893226623535,1699.9372456351043
-8067.78173828125,-139.34727954864502,10547.531304359436,10686.878583908081,613.6008992608258
-8060.26513671875,-136.35155487060547,10538.025993347168,10674.377548217773,1497.8564560273385
-7996.54150390625,-161.7203950881958,10460.375388145447,10622.095783233643,1061.645346499486
-8033.29638671875,-154.33980751037598,10505.738718986511,10660.078526496887,2023.8288065362785
-8074.00537109375,-147.11950397491455,10555.961939811707,10703.081443786621,1085.219075255206
-8046.1572265625,-145.78978633880615,10521.167328834534,10666.95711517334,620.1744028524121
-7979.7724609375,-182.16155624389648,10441.07144355774,10623.232999801636,620.3941170505113
-7935.59716796875,-211.70679378509521,10388.252108573914,10599.958902359009,3066.029005017235
-8159.21533203125,-123.02685928344727,10660.526430130005,10783.553289413452,1706.418760711841
-7923.3173828125,-222.1272029876709,10373.608515739441,10595.735718727112,1299.9398806476215
-8075.78857421875,-144.25639533996582,10558.208130836487,10702.464526176453,2071.0681596896407
-7939.1806640625,-184.72863340377808,10390.902988910675,10575.631622314453,1086.4334805647845
-8080.78369140625,-168.80043697357178,10565.90706539154,10734.707502365112,1229.3087189614776
-7886.36669921875,-235.68344736099243,10328.968752384186,10564.652199745178,1684.0601920240028
-8101.36328125,-147.51603507995605,10590.339618682861,10737.855653762817,1030.3257571811241
-8088.2919921875,-156.81171703338623,10574.716391563416,10731.528108596802,2256.391266729319
-8019.15478515625,-172.43602085113525,10489.348742485046,10661.784763336182,2665.748993118775
-7973.40576171875,-221.88122463226318,10436.069783210754,10657.951007843018,1031.30906061416
-8136.181640625,-158.2095823287964,10634.611562728882,10792.821145057678,2771.171894087337
-8163.05419921875,-135.72906684875488,10666.071779251099,10801.800846099854,2153.362030514242
-8016.22705078125,-189.39380359649658,10487.274317741394,10676.66812133789,1617.7057015093587
-7726.11572265625,-287.9093985557556,10133.400738239288,10421.310136795044,1113.5471881682263
-8218.1142578125,-139.79763412475586,10735.266096115112,10875.063730239868,633.1166792167635
-8132.0126953125,-145.5789966583252,10628.35878944397,10773.937786102295,1063.2705896300888
-8012.44677734375,-196.1860113143921,10483.292084693909,10679.4780960083,1195.3759027688031
-8191.916015625,-133.46612644195557,10702.412850379944,10835.8789768219,1028.0558589919106
-7978.55810546875,-233.86512994766235,10443.388256549835,10677.253386497498,1055.0786869185915
-8223.83984375,-138.89378356933594,10742.209733963013,10881.103517532349,1422.4404820173907
-8049.09423828125,-186.58156394958496,10528.359062194824,10714.94062614441,979.1042630891167
