loss,margin,positive_reward,negative_reward,deterministic_return
0.0,0.0,0.0,0.0,2.4527208740200748
-2289.057861328125,735.4131397455931,4377.9405618608,3642.5274221152067,436.5134584562535
-3170.06396484375,54.317575454711914,5891.741215705872,5837.42364025116,1116.432233574721
-3418.548583984375,10.935270309448242,6308.398146152496,6297.462875843048,728.9883247282653
-3584.924072265625,15.227993965148926,6584.440490722656,6569.212496757507,1539.143154865744
-3746.769775390625,19.805572509765625,6852.8097496032715,6833.004177093506,916.3909642568068
-3862.69970703125,23.63623332977295,7045.149790763855,7021.513557434082,1199.51136269419
-3943.360595703125,22.366235733032227,7179.268599510193,7156.902363777161,1444.5559281771632
-4005.908935546875,28.38905906677246,7283.138882637024,7254.7498235702515,2188.6734276453
-4079.737548828125,12.262728691101074,7407.2944803237915,7395.03175163269,764.3029056739937
-4155.23388671875,16.966949462890625,7532.376742362976,7515.409792900085,1198.4343324928684
-4204.3603515625,10.908212661743164,7614.785608291626,7603.877395629883,2378.752148539417
-4236.17041015625,1.4890985488891602,7668.750018119812,7667.260919570923,2969.8115256166693
-4315.7021484375,7.060024261474609,7800.235147476196,7793.175123214722,762.3124983011397
-4370.07568359375,-0.7860250473022461,7891.340819358826,7892.126844406128,766.4352769711835
-4331.52294921875,-8.25748348236084,7828.708562850952,7836.966046333313,1867.1195285879282
-4457.1220703125,-0.5459814071655273,8036.157199859619,8036.703181266785,783.6013421092385
-4417.38037109375,-13.802155494689941,7972.093719482422,7985.895874977112,1446.782540907442
-4513.13232421875,-11.680720329284668,8130.58620262146,8142.266922950745,1862.8636877683446
-4558.47509765625,0.009730339050292969,8204.904267311096,8204.894536972046,3059.058346671783
-4563.15625,-7.450600624084473,8213.682674407959,8221.133275032043,1369.4620534979174
-4581.29345703125,-3.828549385070801,8243.545830726624,8247.374380111694,718.3562333086375
-4642.10205078125,-2.058743476867676,8344.404220581055,8346.462964057922,1510.2839935132051
-4519.9853515625,-35.946303844451904,8145.426743984222,8181.373047828674,2618.3012071129333
-4706.14208984375,-4.458614349365234,8451.206740379333,8455.665354728699,666.16972187818
-4709.6982421875,1.7190561294555664,8456.577620506287,8454.858564376831,2510.2363118638864
-4661.96240234375,-18.884041786193848,8379.586637496948,8398.470679283142,1463.6325786104414
-4738.5302734375,-6.063769340515137,8505.577408790588,8511.641178131104,332.7063819581669
-4758.52197265625,-2.5684614181518555,8538.437320709229,8541.00578212738,426.6522543247985
-4775.22119140625,-0.920654296875,8566.10004901886,8567.020703315735,1956.375775310662
-4792.48779296875,3.873424530029297,8594.362837791443,8590.489413261414,1222.0683527701929
-4813.67724609375,-7.628198623657227,8630.488247871399,8638.116446495056,2299.277593778483
-4817.43701171875,6.713556289672852,8635.698732376099,8628.985176086426,170.42255434791645
-4871.7880859375,5.495631217956543,8726.01828956604,8720.522658348083,2198.2794242817176
-4891.3974609375,6.478870391845703,8758.333702087402,8751.854831695557,1469.57235616274
-4822.990234375,-15.813825607299805,8647.290336608887,8663.104162216187,648.6947702347604
-4795.9931640625,-17.329902172088623,8603.003775119781,8620.33367729187,595.1444171205902
-4911.96435546875,3.6667890548706055,8793.199297904968,8789.532508850098,2210.1351675481
-4934.6552734375,16.751641273498535,8829.962842941284,8813.211201667786,991.8900793870074
-4938.60546875,13.186695098876953,8836.813061714172,8823.626366615295,1057.0600477458963
-4932.46435546875,6.65385627746582,8827.33485507965,8820.680998802185,2246.416883432208
-4928.849609375,4.007969856262207,8821.574949264526,8817.566979408264,1960.3705279479848
-4965.3232421875,-4.625526428222656,8883.042656898499,8887.668183326721,1217.6646283775983
-4872.67138671875,-38.49634313583374,8732.76302576065,8771.259368896484,1876.3954370565582
-5042.4091796875,17.800508499145508,9008.742418289185,8990.941909790039,1828.7323400944772
-5019.2705078125,6.4530792236328125,8971.55406665802,8965.100987434387,570.7186495573563
-5021.31396484375,12.18000602722168,8974.49975681305,8962.319750785828,1320.9029007675695
-5017.16015625,-1.1512165069580078,8969.0404920578,8970.191708564758,738.2513913531892
-5086.28857421875,19.257946968078613,9081.737221717834,9062.479274749756,1387.0932586315478
-5032.6064453125,7.678952217102051,8994.09709072113,8986.418138504028,689.4317843602865
-5050.0625,8.274189949035645,9022.806435585022,9014.532245635986,3284.4458728164636
-5078.046875,-2.0308446884155273,9070.23362159729,9072.264466285706,2191.2084497919254
-5082.546875,4.855947494506836,9077.324169158936,9072.468221664429,304.1242381536658
-5063.5654296875,-7.191044807434082,9046.874196052551,9054.065240859985,165.56779186348862
-5079.55029296875,-9.914241790771484,9074.025944709778,9083.94018650055,487.08787250434375
-5117.0166015625,11.578598022460938,9133.749987602234,9122.171389579773,166.10828613970412
-5089.30859375,5.1039719581604,9088.839741230011,9083.73576927185,162.99200663313712
-5150.11328125,-0.20670032501220703,9189.962051391602,9190.168751716614,679.0586706180843
-5144.49853515625,7.778079032897949,9179.858009338379,9172.079930305481,830.116261187103
-5168.142578125,5.686335563659668,9219.317051887512,9213.630716323853,169.03214238236484
-5185.79345703125,5.647062301635742,9248.802421569824,9243.155359268188,860.6118475371587
-5199.42529296875,6.257185935974121,9271.265732765198,9265.008546829224,161.77274185977535
-5183.853515625,3.0755348205566406,9245.82719707489,9242.751662254333,2059.148733983267
-5194.18212890625,-2.946643352508545,9263.66839838028,9266.615041732788,159.58467028042315
-5183.74365234375,5.109926223754883,9245.540890693665,9240.43096446991,3073.884885223736
-5195.94140625,2.0830955505371094,9266.156841278076,9264.073745727539,1064.7832300209704
-5089.486328125,-56.86121678352356,9095.058260202408,9151.919476985931,1421.6982977292616
-5282.44873046875,11.317462921142578,9408.777486801147,9397.460023880005,900.138072683046
-5246.58154296875,2.739511489868164,9350.245822906494,9347.506311416626,254.38199472639616
-5265.05712890625,3.690171241760254,9380.830913543701,9377.140742301941,1387.7175695511442
-5256.1220703125,-0.052824974060058594,9366.584079742432,9366.636904716492,2354.778933562071
-5310.53955078125,7.063098907470703,9456.12343788147,9449.060338973999,3194.744657687999
-5106.46142578125,-56.38640356063843,9123.404821872711,9179.79122543335,1421.2269478050118
-5284.06982421875,3.619338035583496,9412.890159606934,9409.27082157135,1121.0389161111011
-5202.4462890625,-36.660090923309326,9281.407559871674,9318.067650794983,594.2231148860913
-5310.61279296875,6.838591575622559,9456.49772644043,9449.659134864807,1177.2152851582966
-5333.599609375,10.942852973937988,9494.211115837097,9483.26826286316,1024.1128430226518
-5343.2265625,7.404916763305664,9510.408014297485,9503.00309753418,1805.707854027241
-5328.84912109375,4.4734392166137695,9487.101618766785,9482.62817955017,2127.984858862309
-5227.6162109375,-33.67327642440796,9322.685155391693,9356.358431816101,1420.9166272705986
-5296.72607421875,-6.548835754394531,9434.439440727234,9440.988276481628,164.5893401204842
-5365.7353515625,-0.4730100631713867,9548.99658203125,9549.469592094421,651.2412359822513
-5285.478515625,-20.91965562105179,9418.036264121532,9438.955919742584,1542.659215420601
-5351.14306640625,2.442194938659668,9524.386510848999,9521.94431591034,819.6442377126151
-5392.88671875,1.1232013702392578,9593.856241226196,9592.733039855957,1219.8016694910837
-5380.12890625,1.1923637390136719,9572.627316474915,9571.4349527359,631.0474737673578
-5395.3701171875,-5.516096115112305,9598.976114273071,9604.492210388184,1337.1780810324074
-5373.07080078125,-12.309924125671387,9562.254697799683,9574.564621925354,1796.296447239435
-5422.27001953125,-0.8687572479248047,9642.939770698547,9643.808527946472,1276.1059419822068
-5353.43994140625,-32.12858009338379,9531.792533874512,9563.921113967896,2322.7669006690758
-5480.328125,11.469812393188477,9738.155271530151,9726.685459136963,702.9828327410974
-5458.603515625,11.48220443725586,9702.106149673462,9690.623945236206,1569.511227183482
-5440.17724609375,-1.8764963150024414,9672.976767539978,9674.85326385498,1801.458815331849
-5471.064453125,0.9863185882568359,9723.925247192383,9722.938928604126,1932.3698979943563
-5387.01953125,-37.72040271759033,9588.302874565125,9626.023277282715,1458.2116357928294
-5424.10107421875,-20.310538291931152,9648.247283935547,9668.557822227478,2842.7033928260807
-5506.07958984375,1.8290510177612305,9781.922404289246,9780.093353271484,3400.5839744353393
-5473.24853515625,-7.581470489501953,9728.543522834778,9736.12499332428,1458.0951397195322
-5501.630859375,1.3213748931884766,9774.704969406128,9773.38359451294,1891.4208720123584
-5472.19775390625,-11.186208724975586,9727.25956439972,9738.445773124695,1159.3597517854514
-5455.703125,-26.1455717086792,9701.480075836182,9727.62564754486,533.1188213522689
-5492.5322265625,-9.284102439880371,9760.655484199524,9769.939586639404,1858.1364576101655
-5538.60205078125,6.04677677154541,9835.69803905487,9829.651262283325,1855.2111738937833
-5543.58203125,-6.194954872131348,9845.25548171997,9851.450436592102,2551.948470774071
-5421.48291015625,-56.727792501449585,9647.82049202919,9704.54828453064,2184.3002055127367
-5488.12060546875,-30.900524139404297,9755.530256271362,9786.430780410767,1362.79448812151
-5553.615234375,-4.468222618103027,9861.816743850708,9866.284966468811,1642.0245633085542
-5547.99658203125,-8.722020149230957,9853.114692687988,9861.83671283722,2805.624033526836
-5433.03857421875,-65.632080078125,9667.80347442627,9733.435554504395,765.5059505264015
-5578.1298828125,-13.780256271362305,9903.611535072327,9917.391791343689,940.6278576887607
-5533.03759765625,-21.47614860534668,9829.62557220459,9851.101720809937,656.5666058093752
-5563.62548828125,-19.58786678314209,9880.172985076904,9899.760851860046,876.5453888847235
-5629.99462890625,1.3880882263183594,9988.236320495605,9986.848232269287,1936.6672780859408
-5554.591796875,-30.36885643005371,9866.045007705688,9896.413864135742,1413.2804541840676
-5532.26806640625,-32.00023174285889,9829.580122947693,9861.580354690552,1467.4685221854886
-5649.220703125,7.309877395629883,10019.825681686401,10012.515804290771,1769.8501929066074
-5462.345703125,-98.65091156959534,9720.044018030167,9818.694929599762,1090.9366675588992
-5552.2763671875,-26.46109962463379,9862.02340888977,9888.484508514404,1025.0190115399805
-5593.41162109375,-31.76084852218628,9931.153213977814,9962.9140625,521.7471849316116
-5614.529296875,-33.25700092315674,9965.967573165894,9999.22457408905,2219.7886013149746
-5651.01416015625,-12.206921577453613,10024.974401473999,10037.181323051453,979.1221462082422
-5606.8916015625,-40.394208908081055,9954.096934318542,9994.491143226624,2602.966010901361
-5627.1298828125,-20.54589080810547,9986.216724395752,10006.762615203857,552.5064028867931
-5527.1806640625,-73.2930817604065,9825.303019046783,9898.59610080719,979.8967056577495
-5447.3955078125,-100.6492977142334,9695.935269355774,9796.584567070007,1102.1551632821106
-5668.02587890625,-16.524703979492188,10053.788826942444,10070.313530921936,1378.8696296786186
-5683.21435546875,-16.754494667053223,10078.812390327454,10095.566884994507,1360.1307076446992
-5670.7783203125,-20.147493362426758,10058.405698776245,10078.553192138672,3465.263832749373
-5691.07861328125,-22.932979583740234,10092.406025886536,10115.339005470276,1891.7429406193203
-5634.29248046875,-37.86819362640381,9999.464150428772,10037.332344055176,726.523140114441
-5716.92138671875,-17.884702682495117,10134.753135681152,10152.637838363647,823.8051030693866
-5595.2421875,-64.5472960472107,9937.622004032135,10002.169300079346,1625.4305401796364
-5653.48486328125,-39.065168380737305,10031.61455821991,10070.679726600647,1053.4411884770748
-5604.7587890625,-84.00879144668579,9955.67964887619,10039.688440322876,702.6281049355937
-5692.48681640625,-43.75122356414795,10096.645809173584,10140.397032737732,1810.2106993442703
-5660.84423828125,-52.645079612731934,10045.35332775116,10097.998407363892,1561.13239465542
-5753.826171875,-14.33665657043457,10195.99048423767,10210.327140808105,895.1473065553802
-5762.07421875,-18.04003143310547,10209.864835739136,10227.904867172241,3121.9504211585136
-5784.3525390625,-15.020634651184082,10246.704953193665,10261.725587844849,1949.1527949416957
-5690.32861328125,-38.25651931762695,10093.309837341309,10131.566356658936,1943.357730371955
-5666.44482421875,-60.80009078979492,10055.749272346497,10116.549363136292,3677.7961107019028
-5693.00390625,-66.35341477394104,10100.792776823044,10167.146191596985,808.5194423233852
-5735.08740234375,-27.028265953063965,10166.111695289612,10193.139961242676,1242.2958865917465
-5725.98193359375,-47.50604963302612,10153.109602451324,10200.61565208435,1538.1594699649515
-5815.74072265625,-12.640758514404297,10298.720373153687,10311.36113166809,839.9609050801296
-5794.5791015625,-24.94135284423828,10264.846304893494,10289.787657737732,1348.0178863529081
-5777.04296875,-34.55328559875488,10236.698518753052,10271.251804351807,2051.425777665212
-5783.28955078125,-38.047593116760254,10247.419375419617,10285.466968536377,2711.5218451432233
-5812.2451171875,-24.017192840576172,10293.99691772461,10318.014110565186,3014.5493625141526
-5646.56787109375,-120.3538167476654,10028.53984951973,10148.893666267395,876.8418612293369
-5679.23193359375,-61.45777362585068,10077.696220934391,10139.153994560242,2673.8189529401557
-5875.1767578125,-14.713541030883789,10397.683990478516,10412.3975315094,1538.3297223874222
-5802.19677734375,-37.92785358428955,10278.822226524353,10316.750080108643,1515.422509525497
-5787.6171875,-59.74339532852173,10257.618404865265,10317.361800193787,1325.065852188703
-5638.9404296875,-89.95920276641846,10012.774377822876,10102.733580589294,1956.2251610233516
-5785.71240234375,-53.075663566589355,10253.57806968689,10306.653733253479,1932.746551281283
-5742.63427734375,-33.903923988342285,10179.92563533783,10213.829559326172,1859.5964557069149
-5820.92626953125,-44.07267665863037,10310.805253982544,10354.877930641174,2609.089116748605
-5799.68896484375,-47.85250759124756,10275.766300201416,10323.618807792664,1039.92954218605
-5882.98486328125,-18.443967819213867,10411.104496002197,10429.548463821411,948.0349253571219
-5743.77197265625,-70.59337615966797,10185.49025440216,10256.083630561829,580.3647739031393
-5882.08984375,-34.742323875427246,10411.243344306946,10445.985668182373,2068.4901473363666
-5845.25830078125,-38.79285430908203,10350.507277488708,10389.30013179779,2364.8168702643475
-5818.3740234375,-49.90701675415039,10306.86925125122,10356.776268005371,1772.7315186912526
-5769.94091796875,-76.23588848114014,10229.388272285461,10305.624160766602,1781.2729934882948
-5672.3642578125,-93.91999018192291,10069.218559265137,10163.13854944706,1320.6298540028577
-5844.7939453125,-39.67259407043457,10350.162097930908,10389.834692001343,2241.567123839623
-5918.8857421875,-27.16162872314453,10471.712434768677,10498.874063491821,1877.943716453472
-5819.35791015625,-65.00035095214844,10310.629658699036,10375.630009651184,1368.245889532419
-5827.73779296875,-68.2063217163086,10324.562915802002,10392.76923751831,819.0276938647736
-5859.00830078125,-53.799116134643555,10375.10176372528,10428.900879859924,1191.7730598985142
-5844.73779296875,-70.21239185333252,10353.126182556152,10423.338574409485,2562.6781118330305
-5834.09130859375,-60.8516902923584,10334.270260810852,10395.12195110321,1783.4583518487946
-5901.138671875,-47.29617786407471,10444.262766838074,10491.558944702148,1789.0965703034867
-5830.5771484375,-65.45787954330444,10329.366586208344,10394.824465751648,1581.7036210768379
-5968.38671875,-24.70391082763672,10553.880401611328,10578.584312438965,800.0928986662143
-5849.6845703125,-64.76929664611816,10360.76240348816,10425.531700134277,1039.4073531044537
-5935.58935546875,-30.18012237548828,10500.099187850952,10530.27931022644,1671.890090035333
-5744.06640625,-110.43216443061829,10189.772182226181,10300.2043466568,1662.8752673115139
-5973.0517578125,-29.29898452758789,10562.389980316162,10591.68896484375,1148.671932783471
-5880.7626953125,-66.24572086334229,10412.823677062988,10479.06939792633,2246.3521601130215
-5952.22900390625,-29.44148063659668,10527.662754058838,10557.104234695435,1547.7998655463489
-5946.716796875,-48.71825695037842,10520.30537700653,10569.02363395691,1591.600655273793
-5953.7255859375,-47.9461145401001,10531.947226524353,10579.893341064453,1312.7882574052728
-5756.53271484375,-144.43942260742188,10214.094420433044,10358.533843040466,2016.2934874513821
-5967.0595703125,-32.06704616546631,10552.438382148743,10584.505428314209,1690.9366118583105
-5975.3291015625,-38.04497718811035,10566.903537750244,10604.948514938354,2449.7024944544123
-5803.35693359375,-103.15308976173401,10288.006380796432,10391.159470558167,636.1191043558904
-5921.6630859375,-60.545610427856445,10480.696024894714,10541.24163532257,4118.57746631712
-5940.490234375,-62.69797992706299,10511.639380455017,10574.33736038208,853.3855194540654
-5600.58984375,-209.84305691719055,9961.889704465866,10171.732761383057,1661.5096040724964
-6006.072265625,-45.4522762298584,10618.706754684448,10664.159030914307,1227.3933778723742
-5903.2138671875,-93.97397565841675,10452.568710803986,10546.542686462402,2215.8510286017445
-5988.56201171875,-33.503366470336914,10588.939645767212,10622.443012237549,1483.2080684801115
-6003.54931640625,-38.501078605651855,10613.746807098389,10652.24788570404,1126.3841429444649
-5892.29248046875,-101.74418354034424,10435.13507938385,10536.879262924194,1181.016696218587
-5985.31201171875,-50.51836013793945,10584.915958404541,10635.43431854248,1365.4710277674696
-6002.2353515625,-45.49952697753906,10612.563446998596,10658.062973976135,2609.914153646535
-5949.5556640625,-78.92637157440186,10528.315265655518,10607.24163722992,1538.3609492009696
-6009.73681640625,-38.67994785308838,10624.517708778381,10663.19765663147,1098.5399886633672
-5996.1787109375,-54.19161033630371,10603.499118804932,10657.690729141235,2435.858468078305
