loss,margin,positive_reward,negative_reward,deterministic_return
0.0,0.0,0.0,0.0,2.476780167067701
-2116.977783203125,881.06887806952,4157.275845512748,3276.2069674432278,2544.7661384870235
-3023.462890625,200.1207413673401,5750.572986602783,5550.452245235443,1303.345641269284
-3277.939697265625,188.15957355499268,6167.933316230774,5979.773742675781,875.6825711516962
-3484.986572265625,180.3539171218872,6508.91019153595,6328.5562744140625,3477.771430015309
-3565.366943359375,181.24583196640015,6641.8385491371155,6460.592717170715,573.40305811482
-3656.92041015625,184.49355554580688,6793.072016239166,6608.578460693359,507.12012221118533
-3772.209716796875,197.77582931518555,6977.914720535278,6780.138891220093,543.4374843929716
-3872.133544921875,180.3083724975586,7146.09613609314,6965.787763595581,566.885870416643
-3896.655517578125,161.82128143310547,7191.445792198181,7029.624510765076,1463.643194119983
-3984.34765625,165.96346378326416,7333.912069320679,7167.948605537415,1301.532277148065
-4050.4541015625,154.13873481750488,7445.647753715515,7291.50901889801,965.624114354525
-4040.12548828125,141.44647693634033,7433.703022003174,7292.2565450668335,1823.1047491657803
-4049.388916015625,116.45774492621422,7455.751393169165,7339.29364824295,1203.8411223745493
-4178.95361328125,132.95969772338867,7663.487943649292,7530.528245925903,911.2611511124819
-4244.48291015625,135.7567481994629,7771.007287025452,7635.250538825989,1102.7863034431266
-4224.18994140625,117.56814527511597,7743.777587413788,7626.209442138672,2407.0011278306206
-4324.52783203125,128.73492431640625,7905.0982837677,7776.363359451294,1803.4107468510283
-4241.2802734375,83.54615879058838,7780.7480664253235,7697.201907634735,1551.8144255401958
-4401.3134765625,111.39634799957275,8036.4472761154175,7925.050928115845,541.4502240653427
-4410.5634765625,113.45974540710449,8051.464987754822,7938.005242347717,1920.8957017057592
-4294.31982421875,64.29587888717651,7876.011688709259,7811.7158098220825,866.4148146930492
-4449.40478515625,113.2945203781128,8116.527704238892,8003.233183860779,715.0408765918881
-4531.1025390625,105.0913028717041,8253.558581352234,8148.46727848053,860.3785974444672
-4499.59033203125,88.33934307098389,8206.072759151459,8117.733416080475,487.79763254142836
-4520.14013671875,82.26440382003784,8241.777136325836,8159.512732505798,957.144865655014
-4603.11474609375,94.57942867279053,8374.997952461243,8280.418523788452,761.717945896116
-4634.208984375,91.45252704620361,8426.810183525085,8335.357656478882,1501.1019511899858
-4618.18505859375,67.3113431930542,8406.081987380981,8338.770644187927,577.9657749361957
-4597.45361328125,66.80188220739365,8373.697292745113,8306.89541053772,449.30827864268645
-4663.154296875,74.67491722106934,8479.398435592651,8404.723518371582,455.13686990380876
-4666.75341796875,66.38756370544434,8488.175506591797,8421.787942886353,1026.8428530830895
-4730.44091796875,81.17377758026123,8588.448637962341,8507.27486038208,452.54100592480233
-4798.35888671875,80.92626285552979,8699.814460754395,8618.888197898865,1395.4175421608418
-4725.42236328125,68.48808002471924,8583.997341156006,8515.509261131287,961.2642395011112
-4746.880859375,63.47432899475098,8620.460188865662,8556.98585987091,2973.036155405885
-4663.45556640625,39.40511131286621,8490.346901893616,8450.94179058075,1979.32581945591
-4855.6767578125,69.08429050445557,8797.312317848206,8728.22802734375,1109.2525712884399
-4811.64990234375,61.821391105651855,8728.019943237305,8666.198552131653,472.27722962341403
-4785.65673828125,42.014610290527344,8690.041153907776,8648.026543617249,434.18972605705045
-4853.10009765625,65.60133266448975,8795.196907997131,8729.595575332642,842.6322478857649
-4862.8515625,66.5457649230957,8811.527173995972,8744.981409072876,464.9353439119361
-4883.27001953125,55.067941665649414,8847.240125656128,8792.172183990479,667.6662910411297
-4879.708984375,54.615610122680664,8843.076483726501,8788.46087360382,495.27387951928563
-4931.06982421875,66.26971817016602,8923.483466148376,8857.21374797821,877.3765535144893
-4907.25439453125,64.83432674407959,8886.148487091064,8821.314160346985,460.43414134707217
-4977.20068359375,71.78334712982178,8998.871520996094,8927.088173866272,469.01867572923777
-4953.6787109375,49.02760887145996,8965.465655326843,8916.438046455383,472.2034716965084
-4913.107421875,32.30678415298462,8903.9812541008,8871.674469947815,1013.4816435058093
-5011.62939453125,68.95942497253418,9056.172971725464,8987.21354675293,485.30879808703884
-5025.455078125,67.23453330993652,9079.723417282104,9012.488883972168,465.55293347956814
-5014.21875,53.36105823516846,9065.528163909912,9012.167105674744,1190.3328344695485
-5043.43701171875,66.6327953338623,9110.100700378418,9043.467905044556,823.0370786835322
-4997.01171875,48.24955177307129,9037.982286453247,8989.732734680176,472.8951343002853
-5086.01708984375,66.85318183898926,9180.410749435425,9113.557567596436,1350.153603595335
-4993.0283203125,36.41582918167114,9035.292321681976,8998.876492500305,453.26870519011203
-5109.78759765625,56.04402446746826,9222.407536506653,9166.363512039185,462.89521803838903
-5065.94287109375,43.40081310272217,9154.01437664032,9110.613563537598,353.053536089886
-5032.2861328125,31.553279399871826,9101.133877277374,9069.580597877502,552.2036741612488
-5141.59326171875,62.4964714050293,9272.976301193237,9210.479829788208,464.05381883436525
-5096.36328125,46.64082908630371,9203.083073616028,9156.442244529724,462.39941950747186
-5166.34423828125,56.84403038024902,9315.533250808716,9258.689220428467,467.58645971842236
-5145.81201171875,48.412132263183594,9283.73865699768,9235.326524734497,474.07252964262153
-5074.6904296875,28.30807876586914,9172.522343635559,9144.21426486969,410.86691032376956
-5206.4970703125,64.20242881774902,9379.849598884583,9315.647170066833,459.2018376372467
-5038.2685546875,4.470896244049072,9117.923905134201,9113.453008890152,992.2279309402134
-5190.4931640625,44.582698822021484,9359.678139686584,9315.095440864563,439.71819550005097
-5232.87548828125,53.708298683166504,9426.772656440735,9373.064357757568,457.09493016633
-5244.2216796875,52.94840431213379,9444.882423400879,9391.934019088745,487.85964724366585
-5245.39892578125,47.10491943359375,9448.96515750885,9401.860238075256,1880.6344840337679
-5182.0048828125,25.517171382904053,9350.110919952393,9324.593748569489,1130.3381288452595
-5283.8056640625,60.34064197540283,9509.004124641418,9448.663482666016,552.5463934199283
-5243.400390625,39.559882164001465,9447.930094718933,9408.370212554932,784.1486984877795
-5259.93505859375,52.29653835296631,9472.166876792908,9419.870338439941,491.7017397586651
-5245.7021484375,34.97049331665039,9453.621949195862,9418.651455879211,1062.0970644873496
-5210.14892578125,23.06608486175537,9398.63244342804,9375.566358566284,1330.689682694721
-5283.810546875,45.621352195739746,9513.428970336914,9467.807618141174,1227.0925104769801
-5204.8095703125,11.761979103088379,9392.952163696289,9381.1901845932,1107.9090643376287
-5172.9736328125,-12.38063669204712,9347.102818965912,9359.483455657959,2147.789983698566
-5083.37451171875,-38.84012222290039,9206.283389091492,9245.123511314392,330.1044113782754
-5385.79443359375,56.64170265197754,9678.481880187988,9621.84017753601,489.07171819151995
-5361.322265625,54.66858673095703,9638.834139823914,9584.165553092957,707.582927174475
-5039.32421875,-111.13629424571991,9153.239846348763,9264.376140594482,1052.5202869767422
-5206.13623046875,-15.29537844657898,9403.643295049667,9418.938673496246,457.0313650939041
-5402.2333984375,64.3050308227539,9705.133235931396,9640.828205108643,453.5832881706173
-5285.5517578125,18.823588848114014,9524.585855007172,9505.762266159058,464.2268899627261
-5413.34130859375,58.57409477233887,9724.441501617432,9665.867406845093,848.7478162371323
-5346.92333984375,34.747694969177246,9621.464261054993,9586.716566085815,1213.5246708570103
-5416.662109375,50.362388610839844,9731.402600288391,9681.040211677551,482.2122080916117
-5224.2890625,-32.99081742763519,9438.545874238014,9471.53669166565,491.8239697824601
-5424.0693359375,63.28105163574219,9740.630674362183,9677.34962272644,2039.5853784742326
-4957.85400390625,-89.70189332962036,9015.16299200058,9104.8648853302,454.3895426835213
-5470.990234375,60.58596229553223,9818.905206680298,9758.319244384766,488.56994465856883
-5306.58984375,8.830187320709229,9562.82850599289,9553.99831867218,469.1435480838633
-5333.806640625,8.829089164733887,9607.770701408386,9598.941612243652,807.7536889577887
-5397.80615234375,41.83648490905762,9704.697260856628,9662.86077594757,440.8371218657242
-5435.19189453125,24.520596504211426,9770.095435142517,9745.574838638306,984.4880335459218
-5486.12646484375,48.09725093841553,9847.896334648132,9799.799083709717,464.3226426562266
-5199.6669921875,-68.88606822490692,9408.4505777359,9477.336645960808,445.7840780311296
-5365.87109375,10.088591814041138,9660.783883810043,9650.695291996002,1078.852500317979
-5411.1689453125,26.360897064208984,9731.29149723053,9704.93060016632,1037.9568748322151
-5502.61279296875,39.23770236968994,9877.396340370178,9838.158638000488,826.2458901905535
-5414.134765625,18.846463203430176,9736.91759109497,9718.07112789154,574.2973371333593
-5521.224609375,43.7178897857666,9907.260480880737,9863.54259109497,460.2092520058292
-5437.82373046875,0.7670698165893555,9781.982508659363,9781.215438842773,2300.287799385828
-5529.03466796875,49.72009086608887,9918.49301147461,9868.77292060852,440.58407299712957
-5350.22216796875,-30.19895526766777,9646.206599503756,9676.405554771423,947.2556661073709
-5570.2021484375,51.88243865966797,9986.654253005981,9934.771814346313,446.3855775599361
-5486.7890625,18.77126693725586,9857.992197036743,9839.220930099487,1088.135979516531
-5391.13232421875,6.12007999420166,9705.22659111023,9699.106511116028,452.7624612829816
-5631.89306640625,63.92763137817383,10084.694948196411,10020.767316818237,446.1983285680916
-5446.7939453125,-1.8989696502685547,9798.031565666199,9799.930535316467,1160.0603211694556
-5505.11376953125,16.590349197387695,9889.159093856812,9872.568744659424,962.5773726182057
-5526.7060546875,17.277015686035156,9924.316809654236,9907.0397939682,933.0462896170246
-5457.22265625,-4.517712593078613,9815.970238685608,9820.487951278687,475.1981685830674
-5589.49658203125,44.94960403442383,10020.761553764343,9975.81194972992,825.5266503627352
-5465.84130859375,-22.78378200531006,9834.861841201782,9857.645623207092,1186.5652882796048
-5096.595703125,-193.58379411697388,9272.035490512848,9465.619284629822,436.1007271937173
-5565.97412109375,37.91970348358154,9984.549827575684,9946.630124092102,883.4541695117888
-5491.2197265625,27.19504165649414,9865.123211860657,9837.928170204163,550.4175545002652
-4969.26708984375,-333.0777046084404,9099.126898109913,9432.204602718353,745.1461903952984
-5300.515625,-104.3237771987915,9581.140637397766,9685.464414596558,3495.490187823306
-5265.619140625,-92.04341340065002,9524.631127595901,9616.674540996552,1760.227792323059
-5638.6376953125,63.48610973358154,10097.973666191101,10034.48755645752,850.4201640831017
-5626.7646484375,57.811946868896484,10079.515021324158,10021.703074455261,876.1446825533963
-5452.36083984375,-49.0026216506958,9820.55306816101,9869.555689811707,483.05625842499916
-5598.7265625,46.78496837615967,10037.02561378479,9990.24064540863,5060.402781370664
-5618.0322265625,49.025097370147705,10068.593249797821,10019.568152427673,433.52724918289863
-5449.04345703125,-44.011610984802246,9815.956142425537,9859.96775341034,1162.7170963533383
-5652.25537109375,47.99098205566406,10125.095116615295,10077.104134559631,548.5318404740348
-5581.6298828125,25.137248039245605,10014.682064056396,9989.54481601715,1203.3596560845708
-5459.50830078125,-13.027465462684631,9825.31294953823,9838.340415000916,757.4499472298519
-5588.01025390625,14.279831886291504,10028.250394821167,10013.970562934875,1187.5888061398052
-5706.84619140625,52.33957481384277,10213.854843139648,10161.515268325806,878.6434614031151
-5550.14404296875,-13.878464460372925,9973.965968370438,9987.84443283081,1226.4500739309765
-5460.1513671875,-6.100975394248962,9823.474564671516,9829.575540065765,932.6289810268087
-5586.6943359375,7.654675483703613,10028.765962600708,10021.111287117004,1019.811999445655
-5637.43798828125,29.0369291305542,10106.21607208252,10077.179142951965,430.9649434318984
-5767.15625,70.03887844085693,10310.0132522583,10239.974373817444,833.8892180312753
-5319.36962890625,-173.70510387420654,9635.840037345886,9809.545141220093,840.8554270007563
-5727.82958984375,73.99066162109375,10243.993669509888,10170.003007888794,833.0881846369601
-5627.76171875,33.33688259124756,10090.115623474121,10056.778740882874,911.6139735812545
-4898.41357421875,-304.2530227303505,8978.09954303503,9282.35256576538,872.8041494924723
-5753.9951171875,87.39065361022949,10283.725191116333,10196.334537506104,1876.3314988836087
-5510.6796875,-36.43599462509155,9915.949533939362,9952.385528564453,843.6557279043016
-5395.23046875,-83.52179163694382,9738.741209328175,9822.263000965118,740.1338191070936
-5660.19970703125,28.136878967285156,10145.478667259216,10117.341788291931,429.29877187800037
-5624.7080078125,-0.05574464797973633,10093.736055850983,10093.791800498962,928.3976053659699
-5758.27978515625,47.93224620819092,10300.817353248596,10252.885107040405,964.592542457312
-5424.45458984375,-74.82687073945999,9785.038038611412,9859.864909350872,479.18581275662444
-5812.54052734375,83.79934501647949,10380.757801055908,10296.958456039429,733.2489476275439
-5698.3623046875,43.92059659957886,10204.32028913498,10160.3996925354,906.7325134574598
-5729.69189453125,23.21140956878662,10259.798670768738,10236.587261199951,885.5965015356358
-5348.93212890625,-97.70544266700745,9666.806833744049,9764.512276411057,985.0546661888421
-5801.04443359375,53.80018901824951,10370.723517417908,10316.923328399658,1245.4778655674509
-5264.26123046875,-232.46741330623627,9559.90811252594,9792.375525832176,949.9090628213904
-5553.1416015625,-38.0296991802752,9987.49283137545,10025.522530555725,832.3130605323654
-5870.36279296875,77.74201583862305,10477.907001495361,10400.164985656738,801.0524763158903
-5541.07568359375,-36.40861940383911,9966.613119125366,10003.021738529205,851.2814769896736
-5799.27197265625,48.04938507080078,10369.449014663696,10321.399629592896,1218.9531923917875
-5878.994140625,81.85739231109619,10491.03563785553,10409.178245544434,914.8744911595583
-5312.02587890625,-296.0769639015198,9653.084661960602,9949.161625862122,768.9931587785293
-5614.203125,-35.13229417800903,10087.030187129974,10122.162481307983,485.53175318436723
-5915.95361328125,82.76346588134766,10551.654172897339,10468.890707015991,928.1316959182335
-5739.294921875,24.74181878566742,10277.010070681572,10252.268251895905,943.2890180864125
-5771.00341796875,19.840797424316406,10330.03584098816,10310.195043563843,831.7357694817103
-5801.67431640625,34.98681831359863,10377.85465335846,10342.86783504486,1281.8625142168498
-5668.734375,-27.135798454284668,10174.457800865173,10201.593599319458,867.2316157942932
-5663.81298828125,-53.10661119222641,10178.305215895176,10231.411827087402,744.6301821551671
-5402.50390625,-93.68619728088379,9750.202193260193,9843.888390541077,751.1433853642449
-5843.68896484375,52.07919406890869,10441.7026720047,10389.623477935791,1098.374117908882
-5895.78125,78.31698799133301,10521.28839302063,10442.971405029297,760.5947850182125
-5656.857421875,-50.86499881744385,10161.226315498352,10212.091314315796,829.8670914667227
-5772.87939453125,14.424654006958008,10335.772472381592,10321.347818374634,965.0750833489368
-5795.49609375,14.846879005432129,10372.224618911743,10357.377739906311,911.9267683496153
-5564.873046875,-76.47458362579346,10017.600466012955,10094.075049638748,2433.1143464296597
-5678.5400390625,-42.45507571101189,10195.240637809038,10237.69571352005,1183.5273014269321
-5737.89013671875,12.09720253944397,10279.609533548355,10267.512331008911,818.0282913141384
-5828.4912109375,34.05400466918945,10422.397819519043,10388.343814849854,778.8795293839369
-5785.09912109375,-7.839487552642822,10361.502809047699,10369.342296600342,885.9677396263542
-5779.66845703125,19.512282371520996,10347.504499435425,10327.992217063904,816.1726940632228
-5818.09814453125,-4.345409870147705,10414.737082958221,10419.08249282837,724.239553101372
-5952.470703125,78.3162488937378,10614.138297080994,10535.822048187256,749.7815604124173
-5512.34521484375,-188.86142587661743,9959.673877239227,10148.535303115845,773.7038286196752
-5755.59619140625,-16.811033248901367,10317.082982063293,10333.894015312195,882.2535548029642
-5850.19873046875,46.43654727935791,10455.332405090332,10408.895857810974,1164.2188739167652
-5512.806640625,-238.48745107650757,9975.450207710266,10213.937658786774,927.7477691588856
-5872.22509765625,38.28154993057251,10494.409937381744,10456.128387451172,872.8353230729809
-5840.181640625,13.791069030761719,10447.883373260498,10434.092304229736,719.7037884181045
-5645.81298828125,-65.23047876358032,10149.685834407806,10214.916313171387,735.5499192120798
-5705.46826171875,-18.46389865875244,10233.59201335907,10252.055912017822,838.703476098014
-5800.7861328125,-32.886616706848145,10395.251322746277,10428.137939453125,744.2444045424152
-5756.07275390625,-8.969836950302124,10316.488921880722,10325.458758831024,938.9107814378484
-5971.13720703125,65.7421350479126,10649.963507652283,10584.22137260437,742.1850239629083
-5974.21826171875,57.08238124847412,10656.551325798035,10599.46894454956,955.4428569465603
-5293.0244140625,-267.8737351298332,9625.453723728657,9893.32745885849,819.9534938049746
-5902.84765625,63.97309112548828,10538.58456325531,10474.611472129822,1424.4620231144736
-5705.693359375,-145.2383280992508,10264.513615965843,10409.751944065094,803.4181579211449
-5907.1708984375,38.65189743041992,10552.853436470032,10514.201539039612,1030.7263955715098
-5631.7216796875,-68.26184010505676,10128.004595041275,10196.266435146332,760.8072847779941
-5667.65283203125,-71.52182602882385,10188.221479177475,10259.743305206299,941.6452893576449
