loss,margin,positive_reward,negative_reward,deterministic_return
0.0,0.0,0.0,0.0,2.4767798995497308
-1328.5927734375,736.0476160794497,4164.092012822628,3428.0443967431784,1267.780209355195
-1937.2001953125,56.92002296447754,5752.703833580017,5695.78381061554,1010.4694074015097
-2133.927978515625,39.82307720184326,6243.525656700134,6203.702579498291,1139.0315119616487
-2247.54541015625,51.539673805236816,6524.871867179871,6473.332193374634,1671.1661461111432
-2313.943115234375,49.341264724731445,6690.904183387756,6641.562918663025,1744.1708782503192
-2397.43115234375,51.57337951660156,6898.315353393555,6846.741973876953,603.2959363537083
-2451.294189453125,41.44064140319824,7033.895336151123,6992.454694747925,589.5865953120716
-2498.565673828125,30.674168586730957,7153.005222320557,7122.331053733826,596.4147398436733
-2545.586181640625,0.7838735580444336,7274.16114616394,7273.377272605896,569.3356271745071
-2493.000244140625,-43.168370485305786,7150.533642292023,7193.7020127773285,567.8186232642365
-2605.9443359375,-7.79283332824707,7425.65155506134,7433.444388389587,3575.900775201331
-2644.873046875,-26.47282886505127,7525.459906578064,7551.932735443115,1093.5179861958004
-2704.9853515625,-34.21165180206299,7676.053945541382,7710.265597343445,346.18995506200537
-2730.598388671875,-51.66679763793945,7742.144380569458,7793.8111782073975,1701.787445835344
-2735.73486328125,-62.71615123748779,7757.008893966675,7819.725045204163,586.6583184248944
-2749.158935546875,-59.98359727859497,7790.556743144989,7850.540340423584,1471.9387980576303
-2808.052001953125,-64.0737419128418,7937.309489250183,8001.383231163025,1457.607481313051
-2795.5986328125,-81.97180843353271,7909.467998504639,7991.439806938171,3084.970436370377
-2856.351806640625,-73.42287349700928,8058.827144622803,8132.250018119812,1286.5100036164488
-2848.392578125,-81.98951721191406,8040.799395561218,8122.788912773132,569.8716030473037
-2871.55615234375,-83.94162178039551,8098.857368469238,8182.798990249634,2418.7797516259466
-2907.72509765625,-74.7063398361206,8187.426977157593,8262.133316993713,2165.82474495971
-2905.80810546875,-91.52459907531738,8185.430758476257,8276.955357551575,1235.1076445372325
-2941.254150390625,-81.42344188690186,8271.758742332458,8353.18218421936,466.461425923433
-2956.687744140625,-90.03823566436768,8311.55462360382,8401.592859268188,433.54819907927754
-2908.83935546875,-106.3986325263977,8195.450055599213,8301.84868812561,996.3225902254517
-3000.939208984375,-83.63538932800293,8420.786491394043,8504.421880722046,457.2464582896318
-3003.45361328125,-94.02458190917969,8428.378964424133,8522.403546333313,2344.609007408251
-2975.3671875,-108.45092010498047,8361.401838302612,8469.852758407593,424.05451606316507
-2987.40869140625,-115.04301500320435,8392.333617687225,8507.37663269043,1074.4247147700582
-3046.71435546875,-86.96570301055908,8535.395574569702,8622.361277580261,1110.2586187316774
-3040.042236328125,-92.95988845825195,8519.736039161682,8612.695927619934,441.6466842595627
-3055.7373046875,-99.63823223114014,8560.194658279419,8659.832890510559,450.32194260686043
-3053.373779296875,-102.37752437591553,8554.640970230103,8657.018494606018,963.2549772366108
-3046.761474609375,-110.94913005828857,8539.660999298096,8650.610129356384,2478.241936454221
-3104.130126953125,-91.75896739959717,8679.515356063843,8771.27432346344,1880.8808795701257
-3085.5244140625,-109.47887802124023,8635.656626701355,8745.135504722595,468.41651440862114
-3081.410400390625,-107.25499153137207,8625.380411148071,8732.635402679443,461.659693718927
-3122.683837890625,-101.50981616973877,8727.381616592407,8828.891432762146,1178.8501844390046
-3139.114990234375,-99.51523494720459,8767.674593925476,8867.18982887268,1985.9001364394103
-3143.126708984375,-102.93132877349854,8778.377880096436,8881.309208869934,1732.9551510990877
-3151.775390625,-111.59463882446289,8800.884461402893,8912.479100227356,1608.8521541964712
-3150.414794921875,-112.43156242370605,8798.045050621033,8910.476613044739,1647.4006938113846
-3197.882080078125,-97.75055408477783,8913.755751609802,9011.50630569458,1218.0569304035519
-3198.321044921875,-98.42592430114746,8915.377781867981,9013.803706169128,1046.7254920967694
-3205.822998046875,-96.94552040100098,8933.72773551941,9030.67325592041,457.45797956516105
-3195.7900390625,-115.51133060455322,8911.390608787537,9026.90193939209,2328.435646070425
-3205.899658203125,-117.63759422302246,8937.006705284119,9054.644299507141,459.424742045655
-3214.67529296875,-99.35234451293945,8956.533354759216,9055.885699272156,1440.0408073192216
-3215.535400390625,-113.72395038604736,8960.827410697937,9074.551361083984,1191.6023507138857
-3208.749755859375,-120.56156635284424,8944.915858268738,9065.477424621582,561.8455520391361
-3238.766845703125,-125.70376062393188,9020.31072473526,9146.014485359192,463.38788220855287
-3221.85400390625,-122.03393363952637,8977.4935464859,9099.527480125427,977.6791761676133
-3266.40478515625,-105.1709623336792,9086.269080162048,9191.440042495728,1272.1371276395905
-3295.951416015625,-101.99001121520996,9159.15585899353,9261.14587020874,1263.0257621594067
-3296.65869140625,-99.46323013305664,9160.712070465088,9260.175300598145,1318.8877326333366
-3214.5361328125,-144.66614055633545,8963.454699516296,9108.120840072632,1892.9152345205512
-3239.6650390625,-146.9429211616516,9026.415604114532,9173.358525276184,2507.6196476385003
-3266.495849609375,-144.06952714920044,9091.961218357086,9236.030745506287,1742.1842565903862
-3339.747314453125,-103.16304779052734,9268.209741592407,9371.372789382935,949.8569695985084
-3309.510498046875,-112.58780860900879,9194.988412857056,9307.576221466064,2648.4022109870875
-3295.10009765625,-126.73443222045898,9161.130071640015,9287.864503860474,1179.4557384307484
-3325.156982421875,-118.4483003616333,9234.516282081604,9352.964582443237,2854.8881100053677
-3354.973876953125,-108.82399940490723,9307.230289459229,9416.054288864136,1112.45948857471
-3338.828125,-119.61812019348145,9268.730785369873,9388.348905563354,458.66712743183564
-3344.38818359375,-122.01087665557861,9283.184255599976,9405.195132255554,1190.3004667053608
-3260.452392578125,-171.57991361618042,9082.381144046783,9253.961057662964,1060.1112833991194
-3293.602783203125,-172.73143887519836,9164.152964353561,9336.88440322876,1197.0347208925507
-3370.5126953125,-114.92044925689697,9347.304100990295,9462.224550247192,2347.120815103433
-3402.18701171875,-112.39535522460938,9425.67822265625,9538.07357788086,1519.1634056525652
-3330.264404296875,-129.87232780456543,9249.595610618591,9379.467938423157,1269.048468130059
-3384.804443359375,-116.97760105133057,9383.368420600891,9500.346021652222,1170.9585305103176
-3296.54248046875,-163.74610996246338,9170.554411888123,9334.300521850586,1060.1571368526136
-3419.032958984375,-110.79201412200928,9467.664649009705,9578.456663131714,1203.8316436579553
-3432.58837890625,-111.55427074432373,9501.34771823883,9612.901988983154,1194.4130693370869
-3417.35009765625,-121.64572811126709,9464.790398597717,9586.436126708984,438.2458891155322
-3398.3388671875,-116.52985382080078,9417.11494064331,9533.644794464111,1091.731076868598
-3316.05322265625,-183.52852773666382,9222.43311047554,9405.961638212204,1176.7160283397566
-3396.52099609375,-132.302339553833,9414.733156204224,9547.035495758057,1174.2831601689436
-3438.53369140625,-115.62790489196777,9517.338611602783,9632.966516494751,1221.2778730907219
-3418.3515625,-127.06787967681885,9468.546357154846,9595.614236831665,912.5367812385223
-3274.909423828125,-201.11768281459808,9123.688762664795,9324.806445479393,888.4364123285446
-3443.195068359375,-134.7691307067871,9531.490324020386,9666.259454727173,1168.7285851015884
-3429.09765625,-113.09735774993896,9493.821653366089,9606.919011116028,939.2169193248425
-3465.296630859375,-111.65521621704102,9583.444431304932,9695.099647521973,1059.264685741037
-3477.1455078125,-118.19614028930664,9613.539785385132,9731.735925674438,899.6512928593022
-3436.75439453125,-128.44363498687744,9514.761033058167,9643.204668045044,1069.8022953683544
-3411.75439453125,-153.61051654815674,9456.78607749939,9610.396594047546,1550.3066138103275
-3487.98828125,-115.45029640197754,9640.64255619049,9756.092852592468,1048.4454252417872
-3444.842041015625,-147.65826892852783,9537.866244316101,9685.524513244629,1632.25881556289
-3478.88232421875,-128.07471561431885,9619.672907829285,9747.747623443604,421.78093483448055
-3493.877197265625,-113.66721725463867,9655.4261636734,9769.09338092804,4128.013655693861
-3407.783447265625,-175.46865892410278,9450.083225727081,9625.551884651184,1029.8274489506016
-3518.114501953125,-104.83084964752197,9714.080027580261,9818.910877227783,1141.7940082427253
-3502.767333984375,-129.3652219772339,9679.24931049347,9808.614532470703,861.7167693699606
-3489.681396484375,-141.33968830108643,9648.721903800964,9790.06159210205,456.19293760846784
-3506.90625,-123.6874418258667,9689.163577079773,9812.85101890564,1031.1343512265817
-3445.993408203125,-160.58821058273315,9543.017969608307,9703.60618019104,3389.0864204917084
-3460.888427734375,-163.88033866882324,9580.443832397461,9744.324171066284,3094.68387820567
-3502.81201171875,-143.26893615722656,9681.78501033783,9825.053946495056,1224.2436288523231
-3547.03369140625,-116.49586009979248,9787.972130775452,9904.467990875244,1171.753426535502
-3504.986328125,-139.8541717529297,9686.640147209167,9826.494318962097,1201.159646693652
-3557.760498046875,-122.540940284729,9815.390440940857,9937.931381225586,1250.8827679224448
-3527.421875,-131.45397424697876,9741.449747562408,9872.903721809387,438.8992909737328
-3531.653076171875,-130.64095211029053,9751.732015609741,9882.372967720032,3251.1428101165684
-3568.650634765625,-118.86416053771973,9842.121118545532,9960.985279083252,1321.6790940257383
-3554.333740234375,-130.0587158203125,9808.270380020142,9938.329095840454,891.7801719608138
-3548.728759765625,-142.5938262939453,9795.986790657043,9938.580616950989,890.4984767210389
-3580.5439453125,-112.86278629302979,9871.036267280579,9983.899053573608,3892.8795553487553
-3502.6943359375,-164.72596836090088,9684.971140861511,9849.697109222412,1300.5907713012543
-3570.569091796875,-135.9539623260498,9849.454116821289,9985.408079147339,894.6127595281417
-3577.31396484375,-122.29475498199463,9864.719628334045,9987.01438331604,852.9564160983796
-3520.50634765625,-185.15244150161743,9732.680760860443,9917.83320236206,1153.549662077587
-3547.093505859375,-130.07623481750488,9790.603395462036,9920.679630279541,1248.0452477242573
-3536.992919921875,-164.44225311279297,9770.498184204102,9934.940437316895,487.8506172126949
-3613.31787109375,-119.2789945602417,9953.609504699707,10072.888499259949,1115.0473104631424
-3595.597900390625,-123.0797348022461,9910.460678100586,10033.540412902832,1905.4033348627313
-3580.48779296875,-140.62306213378906,9875.33265209198,10015.955714225769,2968.5693402913616
-3549.8857421875,-166.293221950531,9802.575825214386,9968.869047164917,1442.329876501284
-3625.823974609375,-124.76516723632812,9985.462663650513,10110.22783088684,1115.014002015587
-3617.8056640625,-122.81910800933838,9965.441792488098,10088.260900497437,2187.8179447350885
-3646.0546875,-125.28987121582031,10035.722524642944,10161.012395858765,1084.8934957245135
-3445.072509765625,-241.77964434027672,9553.750790268183,9795.53043460846,1139.8841379497194
-3614.021484375,-129.02418899536133,9957.356758117676,10086.380947113037,996.2088981235597
-3646.22021484375,-121.19481182098389,10035.797514915466,10156.99232673645,477.7268738107675
-3619.04931640625,-133.02639389038086,9970.442420959473,10103.468814849854,983.2057177166134
-3137.69775390625,-579.2114713191986,8838.80986046791,9418.02133178711,1716.473137625404
-3545.72412109375,-155.72103929519653,9792.1174492836,9947.838488578796,2498.2579889604945
-3611.7099609375,-145.99455070495605,9954.079691886902,10100.074242591858,1026.9712793925703
-3664.313720703125,-125.54425430297852,10081.509759902954,10207.054014205933,460.8492792902879
-3429.203857421875,-345.95304012298584,9528.736420631409,9874.689460754395,1026.4671072422025
-3662.9423828125,-112.3232889175415,10076.685612678528,10189.00890159607,1211.0004498683888
-3664.982666015625,-122.7861909866333,10083.202847480774,10205.989038467407,2194.567059259008
-3585.727783203125,-160.22573804855347,9892.042234897614,10052.267972946167,1148.440530208025
-3683.337890625,-116.17380046844482,10127.625906944275,10243.79970741272,2974.5511846273107
-3680.57666015625,-114.8584508895874,10120.965752601624,10235.824203491211,1210.0818585458053
-3604.48095703125,-166.13754320144653,9939.147032260895,10105.284575462341,3367.6842550253414
-3607.883544921875,-164.1620855331421,9947.791221618652,10111.953307151794,1371.6951005719975
-3638.38330078125,-155.5564579963684,10022.142830371857,10177.699288368225,954.9253897741837
-3540.906494140625,-225.89451026916504,9789.961745262146,10015.856255531311,2110.0304334086813
-3672.205322265625,-134.8309097290039,10103.078981399536,10237.90989112854,1032.2223709502741
-3617.70361328125,-190.15884113311768,9975.636759757996,10165.795600891113,1044.434930188004
-3658.64892578125,-136.57556438446045,10069.91631603241,10206.49188041687,1991.0794220847258
-3680.95068359375,-135.27792930603027,10125.079946517944,10260.357875823975,2226.2857183090787
-3618.1220703125,-205.23322582244873,9979.052694320679,10184.285920143127,1056.5311148637047
-3623.51708984375,-178.0320806503296,9988.972386360168,10167.004467010498,502.43051006053116
-3684.32177734375,-131.98942184448242,10132.879285812378,10264.86870765686,2748.601033855256
-3643.133544921875,-146.39463710784912,10032.64370059967,10179.03833770752,1019.0353036216892
-3632.893310546875,-158.82653069496155,10009.188211679459,10168.01474237442,1041.5774911846738
-3722.773681640625,-125.53477382659912,10227.660155296326,10353.194929122925,1528.3056621179076
-3737.567138671875,-112.54437255859375,10262.84786605835,10375.392238616943,1176.4507873540203
-3453.663330078125,-477.1344813108444,9607.221994519234,10084.356475830078,2907.31508791861
-3488.89404296875,-287.4166415631771,9670.390850543976,9957.807492107153,894.3084952904629
-3628.896484375,-164.0828231871128,10000.696222871542,10164.779046058655,1053.565344363421
-3593.987548828125,-241.85431098937988,9924.903225898743,10166.757536888123,1034.7095266639997
-3612.708251953125,-217.63544368743896,9967.42400932312,10185.059453010559,928.7191479258424
-3669.90771484375,-139.70412683486938,10099.322155475616,10239.026282310486,1098.5865277850999
-3738.564453125,-96.34811687469482,10263.357814788818,10359.705931663513,1201.5532853051159
-3714.196044921875,-143.63797092437744,10209.140532493591,10352.778503417969,2126.6408298410597
-3754.068359375,-101.44930076599121,10302.539337158203,10403.988637924194,2321.9635103329565
-3734.968994140625,-132.38484954833984,10259.122678756714,10391.507528305054,1222.76965630834
-3665.86328125,-177.4028844833374,10094.814752578735,10272.217637062073,1011.2660531717755
-3686.462158203125,-139.6735029220581,10140.184840202332,10279.85834312439,1496.11627935102
-3685.900390625,-141.08745956420898,10139.278680801392,10280.3661403656,1132.990876622779
-3789.34814453125,-117.28544425964355,10392.450178146362,10509.735622406006,1021.8025610808855
-3748.556640625,-123.56217098236084,10291.97791481018,10415.540085792542,447.4566822641887
-3770.90087890625,-125.99027729034424,10348.294903755188,10474.285181045532,1497.6263032106926
-3543.515869140625,-255.2047061920166,9802.391435623169,10057.596141815186,2001.6885861175363
-3805.030517578125,-100.28758811950684,10429.349155426025,10529.636743545532,1044.2747249828171
-3760.6552734375,-132.75572872161865,10323.664310455322,10456.420039176941,1082.5825500996114
-3751.409423828125,-130.23734283447266,10300.66841506958,10430.905757904053,1008.3309772736931
-3700.10107421875,-168.02088928222656,10179.18092250824,10347.201811790466,1181.434623902313
-3689.9658203125,-160.5197582244873,10152.056782722473,10312.57654094696,1050.200125455661
-3715.964111328125,-176.10945224761963,10218.66243839264,10394.771890640259,1169.57996029988
-3733.4716796875,-130.20626640319824,10256.337669372559,10386.543935775757,3956.6155815881057
-3724.572998046875,-147.7531509399414,10236.628479003906,10384.381629943848,1119.557253844226
-3562.720703125,-348.64405369758606,9862.325174093246,10210.969227790833,2913.2666715736295
-3758.61181640625,-147.95080471038818,10321.005831718445,10468.956636428833,1080.476128675155
-3721.031982421875,-131.03425991535187,10225.881408572197,10356.915668487549,1491.9782012987364
-3727.15380859375,-141.35275650024414,10242.474258422852,10383.827014923096,1255.5146164562402
-3592.111328125,-245.73863017559052,9921.40824186802,10167.14687204361,2081.40758124177
-3737.74755859375,-167.61694145202637,10272.257579803467,10439.874521255493,492.0393756419752
-3763.113525390625,-138.8283567428589,10331.497679710388,10470.326036453247,2078.8297076803037
-3802.5390625,-127.0456895828247,10427.212703704834,10554.258393287659,964.2928525879471
-3641.3828125,-233.37845420837402,10043.452338218689,10276.830792427063,1123.0917483342403
-3669.259033203125,-292.01444911956787,10118.412852287292,10410.42730140686,1163.9256726190633
-3794.9052734375,-138.6363182067871,10410.337765693665,10548.974083900452,1199.4573027508047
-3741.778076171875,-173.43704986572266,10283.99612045288,10457.433170318604,5382.009731699286
-3726.095458984375,-209.72020435333252,10248.610829353333,10458.331033706665,1033.9803240633848
-3665.8466796875,-269.12917160987854,10108.821299314499,10377.950470924377,3239.154364712111
-3782.487060546875,-106.8714427947998,10374.642189025879,10481.513631820679,486.63120003613807
-3606.594482421875,-366.0144600868225,9974.457957744598,10340.47241783142,2981.2111214679053
-3795.791015625,-121.14100646972656,10410.263760566711,10531.404767036438,444.5038349092433
-3510.50341796875,-436.5180616378784,9745.064464569092,10181.58252620697,1153.4650671172753
-3832.761962890625,-108.31228828430176,10500.309757232666,10608.622045516968,3142.1230771994683
-3814.84375,-120.98058891296387,10457.684303283691,10578.664892196655,1039.5889230438145
-3787.55908203125,-150.91755485534668,10393.913691520691,10544.831246376038,1122.9525129248848
-3832.843994140625,-116.39578533172607,10501.843368530273,10618.239153862,1961.6228643832071
-3841.095458984375,-110.7966480255127,10521.461309432983,10632.257957458496,885.9610831316141
-3452.5576171875,-522.8995840549469,9614.759398698807,10137.658982753754,2579.6033390689
