loss,margin,positive_reward,negative_reward,deterministic_return
0.0,0.0,0.0,0.0,2.452721083573823
-12584.0,809.3853677362204,4383.246488362551,3573.8611206263304,432.9732447580795
-17047.400390625,143.06625938415527,5897.751709938049,5754.685450553894,1060.0123872958668
-18310.703125,80.47733306884766,6320.263480186462,6239.786147117615,2641.1364195951846
-19041.232421875,60.378201484680176,6563.593058586121,6503.21485710144,1125.4383671384423
-19899.259765625,69.24875068664551,6845.7664976119995,6776.517746925354,1511.1321608546755
-20420.8828125,69.49515342712402,7018.038170814514,6948.54301738739,1971.1349948851034
-20938.951171875,71.06113815307617,7189.353427886963,7118.292289733887,872.8562802179282
-21279.177734375,70.6083345413208,7302.8020095825195,7232.193675041199,713.1931106326397
-21470.724609375,45.16509532928467,7369.139025211334,7323.97392988205,6708.019344912567
-22016.783203125,69.00729179382324,7547.17893409729,7478.171642303467,2432.7201023616344
-22087.115234375,44.131211280822754,7573.653314590454,7529.522103309631,1646.5353305137382
-22449.765625,54.86857318878174,7693.188789367676,7638.320216178894,1847.581021899855
-22523.6875,39.360671043395996,7719.399586677551,7680.038915634155,764.87423041205
-22938.587890625,40.43770408630371,7856.488221168518,7816.050517082214,2063.9597813931755
-23121.041015625,36.94710063934326,7917.871660232544,7880.924559593201,1231.3776647517534
-23307.880859375,39.32440757751465,7979.576442718506,7940.252035140991,1923.9630111878926
-23071.841796875,21.04235553741455,7904.10138130188,7883.059025764465,1062.2975769292857
-23435.849609375,5.651988983154297,8026.216044425964,8020.56405544281,652.1033459332724
-23775.505859375,37.497039794921875,8135.16749382019,8097.670454025269,903.6984875636809
-24018.318359375,25.624653816223145,8217.010705947876,8191.386052131653,2276.78054722338
-24157.84375,21.401549339294434,8263.431365966797,8242.029816627502,3419.8100060720744
-23852.732421875,1.1853082180023193,8165.512650251389,8164.327342033386,1758.2172757083633
-24394.548828125,9.624345779418945,8343.213056564331,8333.588710784912,894.3709059460173
-24514.564453125,12.352907180786133,8383.264113426208,8370.911206245422,1192.8117269882032
-24532.908203125,1.7227840423583984,8390.328614234924,8388.605830192566,2610.071812418061
-24742.02734375,7.561305046081543,8459.137721061707,8451.576416015625,1529.0725284258401
-24729.4296875,-3.414017677307129,8456.335571289062,8459.74958896637,4331.601231193591
-24854.888671875,-5.813182830810547,8497.91825389862,8503.731436729431,3770.4564485924766
-25180.841796875,-3.8975915908813477,8605.826942443848,8609.724534034729,1924.9880888354282
-24842.501953125,-8.184226036071777,8494.378426551819,8502.56265258789,5555.2552507420805
-25392.94140625,-7.113127708435059,8676.060108184814,8683.17323589325,890.3001900788976
-25328.24609375,-6.898027420043945,8655.539148330688,8662.437175750732,1536.4510173096755
-25589.43359375,-6.045571327209473,8742.04880142212,8748.094372749329,1187.8796480100273
-25357.86328125,-21.67620849609375,8666.782508850098,8688.458717346191,3215.0441178389538
-25679.53125,-11.496620178222656,8772.208802223206,8783.705422401428,2413.75391256286
-25791.400390625,-9.95334243774414,8809.40179157257,8819.355134010315,2333.524303323361
-25283.80078125,-48.84258246421814,8645.817801237106,8694.660383701324,884.2262277337485
-25942.18359375,1.6534481048583984,8858.805477142334,8857.152029037476,5410.364628831945
-26248.060546875,-2.516026496887207,8960.133864402771,8962.649890899658,1316.600822610053
-25955.193359375,-14.97143840789795,8865.19219493866,8880.163633346558,1420.8437853597115
-26110.310546875,-10.920015335083008,8915.46002483368,8926.380040168762,1045.5823140137352
-26185.76953125,-26.911163330078125,8942.699723243713,8969.610886573792,1751.6272628238646
-25843.6953125,-32.51884937286377,8829.724309444427,8862.243158817291,3612.811983901896
-26375.337890625,-24.318103790283203,9004.970381736755,9029.288485527039,3639.8371859198023
-26585.134765625,-9.321550369262695,9072.760887145996,9082.082437515259,1982.8895982789836
-26417.888671875,-19.5101261138916,9018.865071296692,9038.375197410583,1916.8927961607023
-26588.521484375,-23.62311553955078,9075.844571113586,9099.467686653137,2845.1904201502102
-26724.857421875,-13.202998161315918,9119.846040725708,9133.049038887024,1951.625351519034
-26769.966796875,-17.735076904296875,9135.35606098175,9153.091137886047,3189.205663784132
-26604.20703125,-36.30729532241821,9082.63767671585,9118.944972038269,2308.5998880281154
-26839.18359375,-14.4158935546875,9157.800523757935,9172.216417312622,1506.2348205170895
-27008.62890625,-11.449992179870605,9214.155040740967,9225.605032920837,1709.7141262135274
-26968.66015625,-17.184125900268555,9201.38109588623,9218.565221786499,4064.4532549633445
-27114.25,-7.5780487060546875,9248.748987197876,9256.32703590393,840.9870621904744
-27040.685546875,-22.80245590209961,9226.135738372803,9248.938194274902,1289.6612884326555
-27274.240234375,-9.918232917785645,9302.417830467224,9312.33606338501,2771.026381140118
-27300.193359375,-21.579012870788574,9312.01441860199,9333.593431472778,2141.863866693493
-27490.41796875,-7.496973037719727,9373.112703323364,9380.609676361084,1485.08222942254
-27212.63671875,-21.46995449066162,9283.237035751343,9304.706990242004,924.8474361285316
-27362.142578125,-27.17346954345703,9333.547297477722,9360.72076702118,1599.824969614087
-27454.150390625,-12.934370040893555,9362.223477363586,9375.15784740448,864.6462778715345
-27346.7421875,-21.130852699279785,9328.34634590149,9349.477198600769,894.3888862938137
-27675.99609375,-11.273702621459961,9435.451511383057,9446.725214004517,4094.998021768149
-27509.90625,-23.14854621887207,9382.19808769226,9405.346633911133,1787.9909137886518
-27731.0859375,-5.928227424621582,9453.507830619812,9459.436058044434,5710.570202120273
-27496.849609375,-25.675798416137695,9378.284673690796,9403.960472106934,975.8062016351589
-27650.537109375,-20.817330360412598,9428.595123291016,9449.412453651428,1260.9020469520324
-27412.41015625,-39.61661434173584,9352.144240379333,9391.76085472107,1392.2414837304077
-27293.166015625,-55.14770722389221,9314.77540755272,9369.923114776611,1497.6941643337047
-27853.115234375,-8.259726524353027,9494.3794631958,9502.639189720154,3725.670422690459
-28088.98828125,-8.867088317871094,9572.470613479614,9581.337701797485,1567.5055943612012
-28012.25,-13.472156524658203,9547.505801200867,9560.977957725525,1532.5302192387192
-28162.169921875,-8.946622848510742,9597.155820846558,9606.102443695068,3976.9631702802626
-27797.404296875,-29.133268356323242,9479.01423072815,9508.147499084473,1264.8868534780995
-27571.16796875,-44.71224927902222,9405.703074932098,9450.41532421112,3339.375564205736
-27950.7890625,-31.54414653778076,9529.981559753418,9561.525706291199,1136.9253730465105
-28265.77734375,-11.336383819580078,9631.905073165894,9643.241456985474,944.3485246893144
-28344.462890625,6.462244987487793,9656.322638511658,9649.86039352417,1225.1218374508687
-28032.17578125,-37.88155460357666,9557.6948928833,9595.576447486877,1588.7458651898273
-28240.615234375,-10.548187255859375,9623.475173950195,9634.023361206055,1262.314511923868
-28320.388671875,-21.28431987762451,9651.386301994324,9672.670621871948,1664.6278315473455
-28092.423828125,-45.233309268951416,9578.412823200226,9623.646132469177,1540.6193095350502
-28306.619140625,-13.130634307861328,9646.300512313843,9659.431146621704,1016.2996032546877
-28238.849609375,-25.42270278930664,9625.138730049133,9650.56143283844,2766.632922481748
-28522.20703125,-7.977252006530762,9717.140793800354,9725.118045806885,599.8539031264685
-28545.51171875,-12.719034194946289,9725.660466194153,9738.3795003891,592.8444785873511
-28594.837890625,-24.438254356384277,9742.617327690125,9767.055582046509,670.1589386629977
-28602.919921875,-15.632097244262695,9744.754115104675,9760.386212348938,890.489555089406
-28818.994140625,-2.472200393676758,9814.70485496521,9817.177055358887,1436.2303974548968
-28528.0234375,-13.483016014099121,9720.402448654175,9733.885464668274,692.1291427741545
-28581.4921875,-14.48806381225586,9738.036724090576,9752.524787902832,981.2706025877967
-28994.00390625,-4.246309280395508,9873.007452011108,9877.253761291504,2468.9593093528374
-28422.150390625,-50.94235324859619,9688.87359046936,9739.815943717957,1014.1457712629646
-28728.67578125,-13.83774185180664,9786.759890556335,9800.597632408142,3100.8782053443856
-28611.3125,-28.751415729522705,9749.857132434845,9778.608548164368,2894.8814017007726
-28942.203125,1.9298095703125,9855.467063903809,9853.537254333496,418.29241995768615
-28977.9453125,-8.096734046936035,9868.237781524658,9876.334515571594,686.4505040070086
-28709.9765625,-22.450751304626465,9782.024399757385,9804.475151062012,864.5012536322419
-28947.37890625,-18.408037185668945,9859.566595077515,9877.974632263184,1300.2794460355483
-27384.486328125,-248.99645519256592,9367.180204868317,9616.176660060883,1118.3513371342092
-28265.4609375,-22.84173011779785,9634.590133666992,9657.43186378479,2002.1166277142124
-28804.8359375,-17.904541015625,9812.858984947205,9830.76352596283,1303.6063528380007
-29308.419921875,-2.494032859802246,9977.440331459045,9979.934364318848,1927.8007969101452
-29136.09375,-22.394237518310547,9923.32106590271,9945.71530342102,1937.958536669112
-28999.7109375,-7.986565589904785,9875.935580253601,9883.922145843506,418.8050863799422
-29160.896484375,-19.482370376586914,9930.62617111206,9950.108541488647,1239.1913417784074
-28459.640625,-77.0378155708313,9705.283036708832,9782.320852279663,1862.34710070548
-29394.765625,-6.861110687255859,10006.844087600708,10013.705198287964,1816.787576876596
-29477.845703125,-2.343751907348633,10034.037769317627,10036.381521224976,407.88810020850207
-29129.962890625,-27.849098205566406,9921.645427703857,9949.494525909424,1151.0286072426418
-29124.11328125,-23.592358589172363,9919.308046340942,9942.900404930115,1120.9547182595763
-28763.86328125,-70.36032009124756,9805.3326587677,9875.692978858948,1004.923273971408
-28872.216796875,-75.03916454315186,9841.466620445251,9916.505784988403,3788.0396540418265
-29303.3046875,-22.994604110717773,9978.714887619019,10001.709491729736,463.7591504805324
-29658.470703125,2.888826370239258,10093.670417785645,10090.781591415405,1769.3254817802942
-29427.46484375,-17.864375114440918,10018.822197914124,10036.686573028564,2233.6063661906605
-29607.705078125,-6.597629547119141,10077.562167167664,10084.159796714783,588.7876784129463
-29658.79296875,-4.369635581970215,10094.641222953796,10099.010858535767,2172.706303082502
-29528.107421875,-32.15618896484375,10054.149032592773,10086.305221557617,413.132772040289
-29618.837890625,-22.075881958007812,10083.408044815063,10105.483926773071,425.94089218079637
-29773.607421875,-3.9846696853637695,10132.781651496887,10136.766321182251,738.0808560912628
-29511.287109375,-22.110774040222168,10048.262858390808,10070.37363243103,748.8974115355667
-29834.2890625,-18.01664161682129,10154.078462600708,10172.09510421753,426.19434446302307
-29196.966796875,-72.15353393554688,9949.305691719055,10021.459225654602,854.8600977654551
-29766.8125,-9.803872108459473,10131.294988632202,10141.098860740662,412.66284299080564
-29556.82421875,-32.64520263671875,10063.948463439941,10096.59366607666,4203.561201847265
-29805.580078125,-16.111188888549805,10144.616827011108,10160.728015899658,432.94043805473086
-29664.443359375,-42.32130432128906,10100.720708847046,10143.042013168335,803.4155098077578
-29707.67578125,-29.46969509124756,10113.60625743866,10143.075952529907,452.1513399083736
-29643.205078125,-36.73603057861328,10093.142650604248,10129.878681182861,447.4748958658803
-29892.728515625,-23.88272190093994,10174.790968894958,10198.673690795898,426.8734617898968
-29749.83203125,-23.107792854309082,10127.13967514038,10150.24746799469,2568.95822505355
-29362.552734375,-62.02625513076782,10003.643367290497,10065.669622421265,2545.061821873569
-29993.1953125,-16.35307502746582,10207.06352519989,10223.416600227356,1589.134280001502
-29239.5703125,-83.1943507194519,9965.441544055939,10048.63589477539,1169.8648410452333
-29983.115234375,-12.82568359375,10203.499484062195,10216.325167655945,444.99501429193793
-30204.935546875,-7.58806037902832,10276.07731628418,10283.665376663208,494.8883625767403
-30114.23828125,-18.391942024230957,10247.598883628845,10265.990825653076,1666.1920999499578
-29886.8203125,-18.207155227661133,10172.517079353333,10190.724234580994,565.5947749575546
-29519.884765625,-64.87275314331055,10056.019605636597,10120.892358779907,1302.828331593924
-30122.904296875,-23.632801055908203,10251.28862953186,10274.921430587769,2064.699476365967
-29804.251953125,-45.14627552032471,10148.32424068451,10193.470516204834,444.22226505385777
-30254.77734375,-8.198287010192871,10293.038080215454,10301.236367225647,433.78472624093547
-30394.1171875,-5.187365531921387,10339.014681816101,10344.202047348022,419.3972228774586
-30087.021484375,-28.544054985046387,10239.871342658997,10268.415397644043,1263.0747468878437
-29344.208984375,-127.39696788787842,10004.0700674057,10131.46703529358,1032.2683661430585
-29905.03515625,-69.68024063110352,10183.927857398987,10253.60809803009,1121.4697662031463
-30504.88671875,-16.510923385620117,10377.008783340454,10393.519706726074,1828.3380817295138
-30221.904296875,-15.156318664550781,10283.670469284058,10298.826787948608,1025.7116040874635
-30364.69921875,-27.583231925964355,10331.691796302795,10359.27502822876,3691.928830445964
-29940.951171875,-44.40369415283203,10193.834058761597,10238.237752914429,746.5761964945898
-30478.44140625,-17.219971656799316,10368.90272808075,10386.122699737549,470.51454266617304
-30164.29296875,-47.2538537979126,10267.290315628052,10314.544169425964,813.2086964499307
-30429.48046875,-14.184096336364746,10352.461730003357,10366.645826339722,4942.405727928199
-29885.05859375,-77.41430759429932,10178.145330905914,10255.559638500214,1729.1132755435813
-30856.728515625,14.493293762207031,10490.601097106934,10476.107803344727,936.5840487254577
-30457.4921875,-27.094582557678223,10362.8058385849,10389.900421142578,1436.3332429536486
-30776.37109375,-7.574733734130859,10465.792472839355,10473.367206573486,2661.8879039800995
-29813.685546875,-85.38707709312439,10156.066752672195,10241.45382976532,937.0762173240487
-30549.8359375,-19.253077507019043,10392.378046035767,10411.631123542786,2419.8585772808237
-30116.1875,-64.3387531042099,10253.703503251076,10318.042256355286,1091.699155841136
-30039.595703125,-69.61544299125671,10229.140019655228,10298.755462646484,461.8548990122705
-30781.916015625,-13.028610229492188,10468.811071395874,10481.839681625366,1007.0911239596485
-30640.650390625,-28.12166404724121,10423.65920829773,10451.78087234497,801.209657742538
-29765.439453125,-92.21193182468414,10140.843990683556,10233.05592250824,5506.043590159386
-30857.529296875,-19.061174392700195,10494.44833946228,10513.50951385498,2018.3922641873437
-30176.259765625,-78.9451904296875,10275.61642742157,10354.561617851257,852.616338064501
-30707.126953125,-21.856203079223633,10445.668521881104,10467.524724960327,1568.370681783153
-31062.845703125,-19.363025665283203,10562.246032714844,10581.609058380127,1959.2544361293374
-30731.193359375,-39.574785232543945,10454.766505241394,10494.341290473938,4697.258053190673
-30577.296875,-41.36542320251465,10404.075876235962,10445.441299438477,3343.0917781144994
-30984.349609375,-21.292147636413574,10536.951170921326,10558.24331855774,2146.0535949416685
-31033.9453125,-15.301551818847656,10552.844858169556,10568.146409988403,2665.942525510282
-31079.60546875,-12.250028610229492,10567.526069641113,10579.776098251343,1017.4082326054895
-30474.7734375,-67.72352361679077,10373.62147283554,10441.344996452332,468.59016668189565
-30073.51953125,-224.9693307876587,10256.67723941803,10481.646570205688,543.5283090073171
-30925.40625,-31.115756034851074,10518.51743221283,10549.63318824768,1321.6758220769088
-31108.96875,-39.98999786376953,10580.26781463623,10620.2578125,2241.1640751344917
-30111.8203125,-156.84026956558228,10263.91213464737,10420.752404212952,1672.5759719597231
-29577.15625,-168.24409765005112,10086.614692270756,10254.858789920807,2289.368178986619
-30045.001953125,-141.03262555599213,10239.168132781982,10380.200758337975,830.9094068831756
-31323.060546875,-15.839859008789062,10648.514197349548,10664.354056358337,865.5440418861735
-31152.0859375,-27.262133598327637,10593.563906669617,10620.826040267944,436.6242870269047
-29950.14453125,-118.95321655273438,10205.507879257202,10324.461095809937,454.60121086827604
-31294.171875,-31.186473846435547,10640.781782150269,10671.968255996704,474.70689539579695
-30617.2734375,-73.55192852020264,10421.687573432922,10495.239501953125,1390.0665418593478
-30874.494140625,-53.24511194229126,10504.8506026268,10558.095714569092,948.3792703645138
-31334.568359375,-30.891623497009277,10654.416501045227,10685.308124542236,432.4229164026445
-30969.09765625,-43.20771408081055,10535.256092071533,10578.463806152344,465.58563828007544
-31295.701171875,-33.46394157409668,10641.732174873352,10675.196116447449,1295.7969878557499
-31222.88671875,-41.44495677947998,10618.023657798767,10659.468614578247,1239.7488841914683
-31535.880859375,-17.885727882385254,10719.421740531921,10737.307468414307,1041.412626829584
-30762.736328125,-91.46678161621094,10471.375095367432,10562.841876983643,811.5177916603059
-31316.720703125,-42.039085388183594,10649.557088851929,10691.596174240112,1355.8524848267186
-31161.43359375,-58.323416233062744,10600.137038707733,10658.460454940796,1261.5089140137466
-30996.37109375,-73.5323486328125,10547.346101760864,10620.878450393677,497.7546000345395
-30199.64453125,-122.29749055206776,10289.281993433833,10411.5794839859,4211.412366090449
-31029.1015625,-83.28599643707275,10558.846097946167,10642.13209438324,2195.6267211773834
-31198.529296875,-53.13227653503418,10612.248649597168,10665.380926132202,2145.0004741221037
-31131.71484375,-58.86844253540039,10590.460710525513,10649.329153060913,1300.7323754272875
