loss,margin,positive_reward,negative_reward,deterministic_return
0.0,0.0,0.0,0.0,9.014115221755956
-12266.0693359375,728.3255868032575,4201.427557319403,3473.1019705161452,682.7187100144369
-16947.064453125,22.162745475769043,5770.975794792175,5748.813049316406,876.5435811526543
-17971.349609375,-10.844902038574219,6112.690360069275,6123.535262107849,624.5182612116259
-18854.505859375,-34.25249767303467,6407.18341255188,6441.435910224915,1127.736549135011
-19623.984375,-39.720993995666504,6663.6669273376465,6703.387921333313,1141.6463630990822
-20149.37109375,-34.168479919433594,6838.637588500977,6872.80606842041,581.4293227730885
-20520.748046875,-41.610087394714355,6962.529557228088,7004.139644622803,962.7422984410755
-21024.146484375,-42.678603172302246,7130.222381591797,7172.900984764099,2044.3654846174425
-21489.318359375,-35.610833168029785,7285.041272163391,7320.652105331421,2213.9413990882786
-21601.40625,-50.78882169723511,7322.834365367889,7373.6231870651245,2139.021210849996
-21846.41015625,-56.505197525024414,7404.410378456116,7460.91557598114,1071.2027623820677
-22323.140625,-51.56993293762207,7563.212799072266,7614.782732009888,2029.0617571821529
-22629.751953125,-48.69349479675293,7665.313940048218,7714.007434844971,1103.5037450167238
-22906.728515625,-47.57341194152832,7757.567451477051,7805.140863418579,1118.2210558956845
-23105.810546875,-63.468926429748535,7824.204149246216,7887.673075675964,1324.203824072575
-23394.16015625,-58.78881645202637,7920.216821670532,7979.005638122559,1175.943161364759
-23578.83203125,-65.10726070404053,7981.865456581116,8046.972717285156,1204.8048854136498
-23750.970703125,-72.1571159362793,8039.36452960968,8111.5216455459595,3708.2005990741945
-23841.943359375,-80.72411918640137,8069.854221343994,8150.5783405303955,1308.5182592619108
-23937.51953125,-87.36580848693848,8101.864722251892,8189.230530738831,1713.7422484938163
-24216.291015625,-87.66995143890381,8194.755075454712,8282.425026893616,1125.3770753526271
-24363.029296875,-78.50955772399902,8243.477381706238,8321.986939430237,868.0195932481454
-24301.90234375,-98.78342247009277,8223.530654907227,8322.31407737732,1440.3650283755098
-24543.5078125,-87.09978771209717,8303.79847240448,8390.898260116577,1101.384314599919
-24727.171875,-81.20281314849854,8364.880117416382,8446.08293056488,1983.3832859533775
-24579.302734375,-92.66662120819092,8315.93552684784,8408.60214805603,1156.8416439995228
-24856.66015625,-98.7288875579834,8408.432666778564,8507.161554336548,1836.6230791981347
-25038.486328125,-81.65768146514893,8468.653952598572,8550.31163406372,3846.8037534500895
-25135.376953125,-82.98054313659668,8500.972226142883,8583.95276927948,2336.204539049049
-25375.03125,-80.3382625579834,8580.710611343384,8661.048873901367,1328.2822991042397
-25291.484375,-79.49825096130371,8552.901063919067,8632.399314880371,2525.1997980336796
-25472.6640625,-83.38473701477051,8613.334498405457,8696.719235420227,1655.7628301107754
-25522.548828125,-86.15374755859375,8630.042116165161,8716.195863723755,866.9668365103645
-25799.4140625,-82.7530345916748,8722.188362121582,8804.941396713257,1505.289223294137
-25696.146484375,-83.3212833404541,8687.915254592896,8771.23653793335,1684.7175140769075
-25631.775390625,-94.61296653747559,8666.69728565216,8761.310252189636,2520.027473597051
-25560.462890625,-113.52374458312988,8643.315755844116,8756.839500427246,2416.0777245942472
-25912.087890625,-107.05178642272949,8760.418509483337,8867.470295906067,887.740154983281
-25627.111328125,-120.60144138336182,8665.529612541199,8786.13105392456,1063.377053806599
-26205.083984375,-78.76171684265137,8857.338096618652,8936.099813461304,1551.1487895832543
-25927.53125,-125.5528359413147,8765.856830120087,8891.409666061401,5048.470793892139
-26272.560546875,-85.2989673614502,8880.01923751831,8965.31820487976,1601.6689751811682
-26276.55078125,-98.7168960571289,8881.592485427856,8980.309381484985,1328.3377122018496
-26397.642578125,-96.87232780456543,8921.924534797668,9018.796862602234,1290.1392460223767
-26185.568359375,-126.96320915222168,8851.886800765991,8978.850009918213,1426.7809252902073
-26555.0625,-91.89062023162842,8974.306234359741,9066.19685459137,1171.3730349176021
-26646.537109375,-92.5370740890503,9004.685862541199,9097.222936630249,768.5634956467072
-26811.30859375,-70.36102867126465,9059.291080474854,9129.652109146118,1339.2101605994508
-26721.865234375,-97.45331382751465,9029.990210533142,9127.443524360657,1611.047562204124
-26904.333984375,-71.22964382171631,9090.242408752441,9161.472052574158,1583.1662478349247
-26956.02734375,-81.86300468444824,9107.687007904053,9189.550012588501,1243.1105079374524
-27201.93359375,-76.7472448348999,9189.481360435486,9266.228605270386,1169.3310722981444
-27066.525390625,-80.9994535446167,9144.50650024414,9225.505953788757,861.3122541063631
-27005.990234375,-92.22867584228516,9124.5693359375,9216.798011779785,1160.842270458754
-27301.2890625,-81.35839748382568,9222.719984054565,9304.078381538391,677.0126810820714
-27167.6484375,-86.93560791015625,9178.385228157043,9265.3208360672,1116.049917088453
-27378.904296875,-86.3460340499878,9248.709714889526,9335.055748939514,830.5603811465191
-27386.65625,-89.76780986785889,9251.368697166443,9341.136507034302,1158.677090586259
-27171.50390625,-108.82952356338501,9180.144462108612,9288.973985671997,1220.4686697205207
-26951.044921875,-129.86463594436646,9107.099259853363,9236.96389579773,1880.0083538553488
-27784.76953125,-61.96006107330322,9383.46757030487,9445.427631378174,1140.4627805179136
-27589.875,-85.22765827178955,9319.073018074036,9404.300676345825,1444.4796208669375
-27599.4140625,-86.33726596832275,9322.232299804688,9408.56956577301,2049.0752721067033
-27474.2265625,-93.84473896026611,9280.732515335083,9374.57725429535,1047.6752537004447
-27766.771484375,-80.00685596466064,9377.88136768341,9457.888223648071,1041.5494315125266
-27839.765625,-75.80551719665527,9402.11955833435,9477.925075531006,1659.1529069944838
-28075.931640625,-66.31349658966064,9480.605868339539,9546.9193649292,1147.7507569244651
-27860.34765625,-81.4647912979126,9409.131180763245,9490.595972061157,1781.2693737881052
-27733.56640625,-104.90307140350342,9367.384140014648,9472.287211418152,3471.4555390088617
-28004.857421875,-87.20736026763916,9457.429270744324,9544.636631011963,1081.5888708423151
-28255.22265625,-74.26461791992188,9540.486473083496,9614.751091003418,1512.5359796984096
-28320.55859375,-70.61783504486084,9562.204461097717,9632.822296142578,1880.5941305679814
-28129.474609375,-85.37611198425293,9498.862131118774,9584.238243103027,1679.443995719491
-28338.060546875,-84.09172248840332,9568.330335617065,9652.422058105469,1875.4239996947886
-28445.546875,-64.38637828826904,9603.780968666077,9668.167346954346,1838.5982632635694
-28163.064453125,-98.7064208984375,9510.34567451477,9609.052095413208,895.5158936572501
-28121.958984375,-111.11151504516602,9496.989158630371,9608.100673675537,2545.901861703169
-28575.328125,-74.17773818969727,9647.211971282959,9721.389709472656,1699.8969601999986
-28758.1796875,-68.3536548614502,9707.998085021973,9776.351739883423,2929.1513273043433
-28591.994140625,-82.96665382385254,9652.937656402588,9735.90431022644,1188.7006507986605
-28659.25,-82.52157402038574,9675.32876586914,9757.850339889526,1706.5062305904792
-28044.591796875,-144.61850452423096,9471.93630027771,9616.554804801941,1073.696261886446
-28702.015625,-80.59591102600098,9689.624160766602,9770.220071792603,1369.7224923828862
-28848.6640625,-82.4008846282959,9738.459819793701,9820.860704421997,1977.8133751872374
-28645.6953125,-107.44342803955078,9671.313076019287,9778.756504058838,1702.7155501994002
-28933.5546875,-86.21386623382568,9766.832911491394,9853.04677772522,1871.3175735828481
-28852.2265625,-85.71480369567871,9739.761068344116,9825.475872039795,1031.315223732784
-28980.52734375,-84.26495361328125,9782.443599700928,9866.708553314209,1552.8136337163644
-28778.150390625,-99.52180099487305,9715.352391242981,9814.874192237854,1289.6974153862213
-28703.41015625,-112.78904151916504,9690.737302780151,9803.526344299316,1052.0771694041634
-28960.763671875,-99.6044397354126,9776.16815662384,9875.772596359253,1049.2858654419208
-28964.8359375,-99.19697284698486,9777.549528121948,9876.746500968933,1316.1865216004219
-28831.66015625,-125.35887622833252,9733.72961139679,9859.088487625122,1167.101562193728
-29148.560546875,-85.68865394592285,9838.491269111633,9924.179923057556,1846.7749713188205
-28863.76171875,-133.29391717910767,9744.575663089752,9877.86958026886,1023.8971384213054
-29428.59375,-71.64175796508789,9931.436199188232,10003.07795715332,1245.802045182049
-29117.794921875,-102.00060749053955,9828.587501525879,9930.588109016418,1488.1259346484428
-28852.6015625,-120.12038612365723,9740.667271614075,9860.787657737732,2282.5895904409217
-29322.724609375,-96.2571268081665,9896.714226722717,9992.971353530884,1158.7230961584125
-29179.677734375,-103.87715911865234,9849.240938186646,9953.118097305298,1223.1511690645436
-29084.271484375,-133.82649993896484,9818.026651382446,9951.853151321411,1395.4458690943134
-29364.712890625,-105.3937292098999,9910.887917518616,10016.281646728516,1150.6876565580076
-29586.720703125,-90.66758632659912,9984.625981330872,10075.29356765747,1251.2076468640544
-29096.88671875,-135.65824699401855,9822.346292495728,9958.004539489746,1235.2429569199398
-29372.689453125,-105.12005710601807,9913.633334159851,10018.75339126587,1271.3702429855093
-29651.685546875,-80.66688919067383,10006.039915084839,10086.706804275513,1384.7835164410997
-29649.3125,-90.2589168548584,10005.452493667603,10095.711410522461,978.7919945824086
-29636.40625,-92.82949161529541,10001.165501594543,10093.994993209839,1286.1116965116187
-29554.095703125,-104.32326316833496,9974.07831954956,10078.401582717896,1895.634272525527
-29792.607421875,-94.11202621459961,10053.284595489502,10147.396621704102,1205.5806741393953
-29525.810546875,-138.85308170318604,9965.340132713318,10104.193214416504,1256.8785344448468
-29188.154296875,-146.65646839141846,9853.067274570465,9999.723742961884,2068.3840460114675
-30032.427734375,-81.36362648010254,10132.917728424072,10214.281354904175,1492.7872147109565
-29298.873046875,-170.59821224212646,9890.413457870483,10061.01167011261,2071.907982158606
-30002.3671875,-92.91910362243652,10123.110189437866,10216.029293060303,1908.322453925982
-29985.37890625,-100.04877185821533,10117.594723701477,10217.643495559692,3101.6942236216178
-29527.73828125,-160.6803159713745,9966.414820671082,10127.095136642456,1640.3015162554225
-29654.263671875,-128.58127975463867,10007.91455078125,10136.495830535889,2026.6137872898098
-29752.8828125,-122.27344989776611,10040.691521644592,10162.964971542358,1148.115418467696
-29810.6171875,-115.20101642608643,10059.723427772522,10174.924444198608,1154.1015484305171
-30016.306640625,-111.29915523529053,10128.158909797668,10239.458065032959,925.9172620012105
-30224.568359375,-96.37399291992188,10197.211488723755,10293.585481643677,1899.1008160747565
-30139.876953125,-99.91799831390381,10169.089484214783,10269.007482528687,1069.8488005214883
-29876.0390625,-136.21616554260254,10081.964664459229,10218.180830001831,1242.9186126545292
-29648.6484375,-144.26722812652588,10006.37961769104,10150.646845817566,2261.098678576792
-29889.3359375,-129.61058235168457,10086.285135269165,10215.89571762085,1920.3659305978688
-29560.580078125,-166.0722074508667,9977.526330947876,10143.598538398743,1334.2774184726775
-30300.13671875,-103.3047866821289,10222.553140640259,10325.857927322388,2362.239324484091
-29600.982421875,-172.62575912475586,9991.088559150696,10163.714318275452,1879.3761543945423
-29609.40234375,-188.35587739944458,9994.259293079376,10182.61517047882,2128.992055282976
-30360.25,-104.76107406616211,10242.642282485962,10347.403356552124,3279.7676222857217
-29336.935546875,-161.38052463531494,9902.887565612793,10064.268090248108,1870.8389673510535
-30176.828125,-123.27557277679443,10181.945157051086,10305.22072982788,1587.783336002588
-30006.61328125,-162.74455499649048,10126.045308589935,10288.789863586426,1872.2404232989143
-30367.25,-113.80202674865723,10245.194544792175,10358.996571540833,917.2922471183787
-30300.220703125,-112.60601329803467,10222.818360328674,10335.424373626709,1125.0514453554497
-30565.2734375,-114.91251945495605,10311.165002822876,10426.077522277832,1362.0215656607718
-30347.833984375,-110.86744499206543,10238.676060676575,10349.54350566864,1797.7032481560566
-30567.71875,-95.55247497558594,10311.627424240112,10407.179899215698,1571.1872110941365
-30558.95703125,-111.07167434692383,10309.001810073853,10420.073484420776,3491.9058056886884
-29731.7109375,-191.81902360916138,10035.134478092194,10226.953501701355,1411.76424258852
-30326.458984375,-134.34650659561157,10232.107636928558,10366.45414352417,2113.824948281366
-30597.6796875,-111.3803186416626,10321.905505180359,10433.285823822021,1647.551312297178
-30222.26953125,-153.51664447784424,10197.695118904114,10351.211763381958,1236.1981191492569
-30773.056640625,-98.50330448150635,10380.153769493103,10478.65707397461,1603.0393245555179
-30368.84375,-137.3428430557251,10246.27772808075,10383.620571136475,1189.3695478213463
-30367.619140625,-148.1099967956543,10246.077738761902,10394.187735557556,1472.9517373147635
-30450.630859375,-158.70353984832764,10273.912957191467,10432.616497039795,1060.604168069628
-30669.64453125,-123.58291244506836,10346.142395019531,10469.7253074646,1940.0928315015935
-30521.572265625,-129.53337955474854,10296.998852729797,10426.532232284546,2415.19052420703
-30616.224609375,-130.55245685577393,10328.516980171204,10459.069437026978,1902.493390136598
-30791.25390625,-114.48852157592773,10386.507955551147,10500.996477127075,1194.1577002036554
-30531.634765625,-137.6789960861206,10300.49061870575,10438.16961479187,1273.611018032748
-30370.04296875,-165.5795669555664,10247.26279258728,10412.842359542847,2429.2000319806907
-30895.5078125,-109.89175796508789,10421.14554977417,10531.037307739258,1316.1109057839597
-30457.8515625,-136.5271110534668,10275.926559448242,10412.453670501709,1242.0571427488408
-30482.654296875,-150.0248498916626,10284.504683494568,10434.52953338623,2646.659426563587
-31137.0703125,-100.76342678070068,10501.463196754456,10602.226623535156,770.6048468504551
-31157.53125,-94.49076557159424,10508.124127388,10602.614892959595,1913.041234087368
-30322.685546875,-166.22425174713135,10231.493220329285,10397.717472076416,1098.0445576708037
-30717.337890625,-150.61333465576172,10362.634828567505,10513.248163223267,1223.9824913842376
-30781.015625,-120.67040252685547,10383.275789260864,10503.94619178772,2361.9516753895027
-30951.578125,-131.63019180297852,10440.26072883606,10571.890920639038,1996.9119173914155
-30922.10546875,-129.37809658050537,10430.452787399292,10559.830883979797,1914.4138880771811
-30271.712890625,-163.46324110031128,10214.50517129898,10377.968412399292,1145.4996584883538
-31128.90234375,-125.36962795257568,10499.216153144836,10624.585781097412,1155.0899310853647
-30925.498046875,-144.01935195922852,10431.89243888855,10575.911790847778,1560.8360615426984
-31293.16015625,-97.55598735809326,10553.441463470459,10650.997450828552,1529.1015116945894
-30873.505859375,-146.16036987304688,10414.632108688354,10560.792478561401,1195.120747060075
-31112.1015625,-119.67869758605957,10493.572500228882,10613.251197814941,1127.7931227047009
-31140.845703125,-114.79961967468262,10503.106578826904,10617.906198501587,1334.7416021669692
-30908.060546875,-142.63237857818604,10426.056900978088,10568.689279556274,1112.8275419957006
-31465.140625,-94.33433437347412,10610.713448524475,10705.04778289795,1298.662481049296
-31438.384765625,-100.08429145812988,10601.848150253296,10701.932441711426,1161.740492430549
-31373.033203125,-108.04515075683594,10580.274574279785,10688.319725036621,1977.6516738237342
-31051.259765625,-152.08119201660156,10473.909353256226,10625.990545272827,1732.361422112093
-31423.865234375,-126.25442600250244,10597.541420936584,10723.795846939087,1732.252699138033
-30785.1875,-193.7726058959961,10386.12124824524,10579.893854141235,1198.0844789527907
-31512.65625,-108.63467502593994,10626.799174308777,10735.433849334717,1103.1804914713891
-31367.380859375,-136.54094409942627,10578.950995445251,10715.491939544678,973.4049470975872
-30892.818359375,-159.80252265930176,10421.422956466675,10581.225479125977,1829.4275461947325
-31476.841796875,-115.73433017730713,10615.011351585388,10730.745681762695,3811.0821816062044
-31396.958984375,-118.18884086608887,10588.477977752686,10706.666818618774,714.5091969548257
-31725.83984375,-108.80370235443115,10697.807448387146,10806.611150741577,2225.2446575535123
-30983.548828125,-171.76469039916992,10451.822525024414,10623.587215423584,1210.7967551730549
-30995.763671875,-164.05128860473633,10455.812767982483,10619.86405658722,1529.9680789419488
-31341.103515625,-145.8815402984619,10570.46272945404,10716.344269752502,1900.459581087323
-31198.935546875,-141.30043411254883,10522.984943389893,10664.285377502441,504.5711883835751
-31479.052734375,-133.43717002868652,10616.134998321533,10749.57216835022,1216.637628835128
-31762.17578125,-96.08522605895996,10709.674835205078,10805.760061264038,1987.5372492460629
-31495.546875,-120.3474817276001,10621.395058631897,10741.742540359497,1056.8106097155585
-31593.849609375,-101.28518295288086,10653.764720916748,10755.049903869629,1506.6931248973572
-31262.658203125,-147.69105529785156,10544.314905166626,10692.005960464478,2936.702345404414
-31566.80859375,-136.25061225891113,10645.405742645264,10781.656354904175,1521.7927787407873
-31224.45703125,-161.4632740020752,10531.876628875732,10693.339902877808,1214.7844141298767
-31802.673828125,-106.40942096710205,10723.390442848206,10829.799863815308,1272.9378513173742
-31657.23046875,-121.98607063293457,10675.305952072144,10797.292022705078,1484.7781221937053
-31368.541015625,-146.5670862197876,10579.589037895203,10726.15612411499,3689.0526599090335
-31479.1875,-149.17863655090332,10616.493151664734,10765.671788215637,1217.1821351292058
-31713.65234375,-124.43242263793945,10694.158201217651,10818.59062385559,1594.9205984218236
