loss,margin,positive_reward,negative_reward,deterministic_return
0.0,0.0,0.0,0.0,8.40902279931575
-4022.2470703125,782.363122805953,4357.6483390033245,3575.2852161973715,666.2564413018558
-5517.17529296875,74.46595668792725,5881.1362590789795,5806.670302391052,1387.5574590315916
-5980.4853515625,13.665082931518555,6346.519558906555,6332.854475975037,764.3830653067141
-6218.203125,-11.119620323181152,6584.962333679199,6596.08195400238,855.4396233202555
-6425.98046875,-35.263845443725586,6793.766069412231,6829.029914855957,3298.927809486554
-6634.18603515625,-44.25328350067139,7002.054873466492,7046.308156967163,1572.998033590227
-6816.126953125,-49.67658519744873,7183.998502731323,7233.675087928772,1507.4104840264652
-6898.3642578125,-60.27387237548828,7266.886903762817,7327.160776138306,1829.3635776046322
-7078.64501953125,-79.82554054260254,7447.789284706116,7527.614825248718,2900.9984452192743
-7174.85595703125,-87.71494770050049,7544.444362640381,7632.159310340881,546.1860131360319
-7205.8544921875,-101.01564502716064,7576.527008056641,7677.542653083801,2455.6101743457557
-7349.26806640625,-103.90956592559814,7719.729767799377,7823.639333724976,1732.3762534727402
-7446.56884765625,-103.6986894607544,7816.818989753723,7920.5176792144775,1402.2445983783898
-7524.51806640625,-111.66923999786377,7895.132815361023,8006.802055358887,1416.516353151053
-7607.58935546875,-120.4651288986206,7978.511661529541,8098.976790428162,917.4323933740192
-7527.2705078125,-132.5075168609619,7899.531376838684,8032.038893699646,416.3539807691574
-7693.0615234375,-119.86073875427246,8064.061279296875,8183.9220180511475,973.43552997348
-7735.98974609375,-133.7575855255127,8107.862154006958,8241.61973953247,1946.1880777657127
-7790.0224609375,-129.4492597579956,8161.35405921936,8290.803318977356,2911.0497544126597
-7771.49169921875,-152.0584053993225,8144.356367588043,8296.414772987366,583.0181987049914
-7872.97265625,-137.27588939666748,8244.702352523804,8381.978241920471,2206.7460101490865
-7941.94091796875,-135.59758281707764,8313.446208953857,8449.043791770935,1914.0553123476222
-7911.490234375,-142.37030029296875,8283.623767852783,8425.994068145752,2216.209267207172
-7982.453125,-144.4732666015625,8354.48003578186,8498.953302383423,3305.248313982182
-8047.12646484375,-141.68369960784912,8418.906845092773,8560.590544700623,577.6485465193042
-8058.48193359375,-148.3395299911499,8430.69071483612,8579.03024482727,566.9380745426388
-8119.44775390625,-145.84873294830322,8491.370679855347,8637.21941280365,561.0110060711537
-8108.255859375,-156.5701141357422,8480.86925983429,8637.439373970032,2592.7137040985285
-8123.6142578125,-168.342924118042,8496.979489326477,8665.322413444519,1736.5742971931359
-8076.43505859375,-165.36430835723877,8449.631406784058,8614.995715141296,1590.3976514767771
-8256.30078125,-142.87755584716797,8627.825099945068,8770.702655792236,2730.4726325936417
-8276.6875,-149.29751300811768,8648.646718025208,8797.944231033325,1738.7292257053166
-8179.841796875,-167.79247522354126,8553.23085641861,8721.02333164215,4590.900725527937
-8365.9521484375,-154.42491054534912,8737.98846912384,8892.41337966919,852.4602955150563
-8360.365234375,-147.6713981628418,8731.961448669434,8879.632846832275,2281.453406302062
-8319.35546875,-165.44244813919067,8692.40325975418,8857.845707893372,2324.398734698541
-8287.517578125,-177.0433406829834,8661.23996925354,8838.283309936523,3612.281342396127
-8361.0283203125,-173.29842567443848,8734.402088165283,8907.700513839722,1634.330984725972
-8408.921875,-159.426851272583,8781.394194602966,8940.82104587555,1684.4556514256474
-8499.638671875,-155.31823921203613,8871.680663108826,9026.998902320862,5002.38528086458
-8483.5673828125,-159.30384159088135,8855.869742393494,9015.173583984375,1255.7420724975052
-8487.5205078125,-155.0827808380127,8859.842581748962,9014.925362586975,1811.7395622390757
-8601.369140625,-136.8455581665039,8972.101615905762,9108.947174072266,1453.9539539159402
-8559.58984375,-162.2881956100464,8931.809407234192,9094.097602844238,590.8701727612203
-8515.5126953125,-168.74649620056152,8888.577330589294,9057.323826789856,4018.255439183613
-8665.2412109375,-144.29578399658203,9036.449626922607,9180.74541091919,1821.291114922985
-8649.4072265625,-162.71001815795898,9021.776488304138,9184.486506462097,428.2224954024035
-8705.03125,-139.2550754547119,9075.831712722778,9215.08678817749,556.8186598695986
-8711.796875,-147.8997745513916,9083.208307266235,9231.108081817627,1199.4543348476234
-8622.7685546875,-175.83905029296875,8996.225040435791,9172.06409072876,956.7639357323598
-8794.2041015625,-142.43661785125732,9165.171511650085,9307.608129501343,2394.835924773618
-8608.8505859375,-182.0577130317688,8982.549028873444,9164.606741905212,2811.3685031591244
-8792.69921875,-151.0731372833252,9164.247278213501,9315.320415496826,2364.404485096826
-8483.9833984375,-222.93438506126404,8860.880606889725,9083.814991950989,1108.0384301029915
-8837.6376953125,-153.99648761749268,9209.232964515686,9363.229452133179,1130.505414382032
-8866.2080078125,-144.66948890686035,9237.194961547852,9381.864450454712,1789.989624112539
-8900.81640625,-149.30416870117188,9271.982118606567,9421.28628730774,600.1053456844329
-8925.8740234375,-149.11088848114014,9297.061337471008,9446.172225952148,1664.3691865293467
-8921.0478515625,-151.82473754882812,9292.426633834839,9444.251371383667,1603.2608069857922
-8913.8173828125,-159.9828805923462,9285.77820968628,9445.761090278625,1406.017145669581
-8922.828125,-155.15077114105225,9294.594158172607,9449.74492931366,1418.1621630677732
-8955.50390625,-170.01165580749512,9328.20548248291,9498.217138290405,1134.0339024259836
-8989.94140625,-146.7580165863037,9360.929647445679,9507.687664031982,3495.153746439302
-8988.28515625,-151.29081916809082,9359.726450920105,9511.017270088196,561.5703925043325
-9051.9814453125,-151.4134750366211,9423.246952056885,9574.660427093506,1063.016031513285
-9006.50390625,-168.44645500183105,9378.799471855164,9547.245926856995,2698.7218680114797
-9067.419921875,-170.3550682067871,9439.863887786865,9610.218955993652,554.3262818288985
-8868.451171875,-175.01786017417908,9241.704677820206,9416.722537994385,854.9609288745204
-9123.912109375,-153.73681640625,9495.286270141602,9649.023086547852,566.6308380505176
-9160.26171875,-149.83826637268066,9531.34236907959,9681.18063545227,693.2458150260203
-9011.396484375,-194.69445705413818,9385.522161483765,9580.216618537903,903.930423667799
-9147.171875,-159.44667148590088,9518.84568309784,9678.29235458374,1989.9845531718245
-9159.064453125,-149.35763263702393,9530.137307167053,9679.494939804077,1409.1587118007324
-9165.4033203125,-157.04964923858643,9537.015122413635,9694.064771652222,3128.443432338425
-9108.611328125,-163.61462497711182,9480.711050987244,9644.325675964355,1741.8747399608776
-9124.611328125,-175.87912130355835,9497.613213062286,9673.492334365845,2460.451314698064
-9262.2373046875,-159.23188400268555,9633.623601913452,9792.855485916138,2289.90882983972
-9264.8193359375,-156.18570518493652,9636.131273269653,9792.31697845459,574.4335385701706
-9213.021484375,-163.43273258209229,9585.03017616272,9748.462908744812,1500.5159613339563
-9222.5966796875,-164.93077659606934,9594.725949287415,9759.656725883484,3299.922541311431
-9184.12109375,-192.24019527435303,9557.986229896545,9750.226425170898,426.7839540188799
-9215.1533203125,-162.89046573638916,9587.233190536499,9750.123656272888,924.8472346911315
-9171.0087890625,-190.5204095840454,9544.84661769867,9735.367027282715,1221.6973445308686
-9144.3916015625,-213.90246868133545,9519.899771690369,9733.802240371704,1244.534247419445
-9268.54296875,-171.00930213928223,9640.872840881348,9811.88214302063,1580.5026567097
-9215.3017578125,-200.84787940979004,9589.642577171326,9790.490456581116,545.1816692953258
-9378.8212890625,-165.14995861053467,9750.621832847595,9915.77179145813,428.5017472865005
-9290.4140625,-189.33513164520264,9663.966773986816,9853.301905632019,1905.30890252553
-9450.8896484375,-158.2025146484375,9822.208475112915,9980.410989761353,3981.8822715261635
-9350.716796875,-178.00080394744873,9723.491353988647,9901.492157936096,564.4701371324522
-9417.75390625,-170.80940437316895,9789.984860420227,9960.794264793396,435.34463281905806
-9419.755859375,-164.1767978668213,9791.634721755981,9955.811519622803,438.24056434222337
-9445.2421875,-171.45659351348877,9817.448117256165,9988.904710769653,5710.676463117307
-9456.3798828125,-179.01015281677246,9828.960205078125,10007.970357894897,1904.1171311204666
-9506.0703125,-156.9292631149292,9877.261501312256,10034.190764427185,1054.1809305106979
-9434.3447265625,-188.45080184936523,9807.539080619812,9995.989882469177,926.8087899625384
-9489.7578125,-172.28289031982422,9862.052547454834,10034.335437774658,1521.7930661683565
-9467.2421875,-178.06112957000732,9839.946902275085,10018.008031845093,1302.9063515996268
-9566.830078125,-173.3856658935547,9938.882474899292,10112.268140792847,918.3590152450543
-9539.7021484375,-173.17392826080322,9911.982789039612,10085.156717300415,3357.245595330507
-9581.4892578125,-170.5189504623413,9953.428027153015,10123.946977615356,2978.8730295695386
-9522.873046875,-190.06324863433838,9896.023006439209,10086.086255073547,2764.346507310069
-9501.66796875,-199.86652660369873,9875.624467849731,10075.49099445343,1728.26435584804
-9567.267578125,-180.07422924041748,9940.145522117615,10120.219751358032,1786.8079287103121
-9378.3291015625,-210.72706842422485,9753.470659732819,9964.197728157043,2756.31764465501
-9685.90234375,-171.43938732147217,10057.751065254211,10229.190452575684,3154.717408027193
-9575.130859375,-189.30683135986328,9948.19938659668,10137.506217956543,440.62708544797647
-9617.0166015625,-176.06476593017578,9989.3337059021,10165.398471832275,1432.3035813373908
-9622.669921875,-197.14963722229004,9996.212934494019,10193.362571716309,1917.840044066914
-9692.68359375,-167.82831478118896,10064.38420009613,10232.21251487732,595.5657641322897
-9632.2666015625,-182.53538417816162,10005.004900932312,10187.540285110474,1168.275957488598
-9714.8603515625,-175.93507385253906,10087.006338119507,10262.941411972046,2551.0647918206696
-9593.2568359375,-197.35414123535156,9967.235618591309,10164.58975982666,2261.1583439554474
-9725.21484375,-179.11537170410156,10097.659260749817,10276.774632453918,4116.246929373107
-9680.455078125,-193.16424179077148,10053.835083007812,10246.999324798584,546.289693415559
-9744.6376953125,-178.74999618530273,10117.037761688232,10295.787757873535,1283.929453563255
-9555.3037109375,-223.06859683990479,9930.861352920532,10153.929949760437,1155.9462314861491
-9607.7353515625,-213.9152810573578,9982.689388513565,10196.604669570923,1693.4236717955755
-9766.033203125,-174.5833978652954,10138.265446662903,10312.848844528198,586.9490285214052
-9743.44140625,-179.71902751922607,10116.045310974121,10295.764338493347,2441.3971367388776
-9811.537109375,-174.56219482421875,10183.468091964722,10358.03028678894,2087.5870455321024
-9750.4697265625,-188.0881061553955,10123.578734397888,10311.666840553284,1557.6067310192134
-9734.220703125,-196.1489553451538,10107.87850856781,10304.027463912964,2165.749058903146
-9478.71484375,-275.53814029693604,9857.556963920593,10133.09510421753,2105.122366790083
-9823.033203125,-178.69489765167236,10195.420182228088,10374.11507987976,4446.387903601995
-9799.669921875,-190.98004245758057,10172.931903839111,10363.911946296692,549.3162085749827
-9891.8154296875,-186.72252655029297,10264.527128219604,10451.249654769897,2160.6875544029444
-9697.9033203125,-205.04366660118103,10072.477073907852,10277.520740509033,2124.3290092789007
-9764.9619140625,-217.89282035827637,10139.773887634277,10357.666707992554,1475.927748934099
-9904.1025390625,-175.25938606262207,10276.187191009521,10451.446577072144,4025.773061688366
-9862.2490234375,-189.18932723999023,10235.232020378113,10424.421347618103,1341.1950152362742
-9702.0185546875,-233.58454084396362,10078.128495693207,10311.71303653717,1241.8560959770373
-9804.4267578125,-215.93759632110596,10179.25355052948,10395.191146850586,439.9213146545477
-9878.130859375,-184.45125579833984,10250.955567359924,10435.406823158264,1802.9382821420174
-9968.87890625,-173.0556240081787,10340.785503387451,10513.84112739563,1788.3607679339389
-9720.427734375,-226.19994115829468,10096.182248592377,10322.382189750671,1175.4691791754976
-9882.7001953125,-198.37208032608032,10256.5297665596,10454.901846885681,533.5541176378625
-9932.5400390625,-199.58183002471924,10306.151267051697,10505.733097076416,2715.536645713576
-9993.6640625,-176.27873992919922,10365.70764541626,10541.986385345459,3680.4909306277827
-9897.85546875,-210.46125888824463,10272.236233711243,10482.697492599487,1927.9437333238388
-9800.5029296875,-223.38305377960205,10175.834033966064,10399.217087745667,564.063500262307
-9998.23828125,-187.41321086883545,10371.036396980286,10558.449607849121,2829.1024367802283
-9980.5556640625,-200.25748348236084,10354.200716972351,10554.458200454712,550.2038637410857
-9823.119140625,-228.91536903381348,10198.816268920898,10427.731637954712,575.3577352032579
-9810.5673828125,-238.5276701450348,10186.953936338425,10425.48160648346,574.5110608464167
-10053.2958984375,-185.19932556152344,10425.802053451538,10611.001379013062,1179.5368200654225
-9841.8486328125,-237.78956747055054,10218.239703655243,10456.029271125793,556.924009436437
-9773.814453125,-271.5791120529175,10152.102935791016,10423.682047843933,537.1406711380971
-9852.1669921875,-260.4240093231201,10229.548369407654,10489.972378730774,1844.3270188552622
-10118.9130859375,-183.78273963928223,10491.266576766968,10675.04931640625,570.9901757290473
-10052.5595703125,-193.6305742263794,10425.749665260315,10619.380239486694,562.5413442701266
-9897.884765625,-279.02139377593994,10276.121615409851,10555.143009185791,2032.291353866673
-9930.0322265625,-225.0744104385376,10305.37408733368,10530.448497772217,573.2576052559803
-10061.271484375,-211.73862838745117,10435.464429855347,10647.203058242798,540.3382882344615
-10101.03515625,-210.94690895080566,10475.090337753296,10686.037246704102,1342.469707737369
-9839.26171875,-255.0877604484558,10216.399331569672,10471.487092018127,1232.996711558846
-9962.095703125,-219.32458972930908,10337.12868309021,10556.453272819519,590.2295796211927
-10088.498046875,-192.0224552154541,10461.647840499878,10653.670295715332,600.4515169680936
-9835.859375,-282.1636643409729,10214.874735355377,10497.03839969635,1040.7793078125894
-10075.9853515625,-218.57930088043213,10450.899820327759,10669.479121208191,1975.902400409574
-10219.1533203125,-166.12497329711914,10590.414333343506,10756.539306640625,2067.16827361486
-10085.2177734375,-214.81590270996094,10459.716236114502,10674.532138824463,494.6393944205037
-10153.703125,-205.78008937835693,10527.325675964355,10733.105765342712,435.41867110171887
-10124.3720703125,-206.5284299850464,10498.332776069641,10704.861206054688,564.9984021348106
-10171.2626953125,-196.85177040100098,10544.55464553833,10741.406415939331,567.7776987638828
-10147.7705078125,-202.16472148895264,10521.534029960632,10723.698751449585,440.7316754879943
-10142.060546875,-208.20933151245117,10516.081270217896,10724.290601730347,1555.6201320565963
-10236.947265625,-193.35990524291992,10609.917510986328,10803.277416229248,586.199353120859
-10068.09765625,-231.32316172122955,10443.983524680138,10675.306686401367,3001.6835389567523
-10143.751953125,-211.65584087371826,10518.23874759674,10729.894588470459,1164.0438826928867
-10223.5322265625,-217.06968021392822,10598.09883403778,10815.168514251709,1069.4636987509944
-10170.3505859375,-199.02578926086426,10543.719116210938,10742.744905471802,2735.4911417566364
-10096.427734375,-231.532555103302,10472.061909198761,10703.594464302063,523.2459351636068
-10049.4794921875,-258.8898801803589,10426.908843040466,10685.798723220825,3881.570435808992
-10110.3046875,-235.50852298736572,10486.189764976501,10721.698287963867,439.78258813341324
-10295.87890625,-189.9108772277832,10668.731884002686,10858.642761230469,423.814628083601
-10174.431640625,-225.42820072174072,10549.717574119568,10775.145774841309,461.6795935190056
-10389.6328125,-180.29322242736816,10761.601686477661,10941.89490890503,476.4724239216718
-10229.2529296875,-210.3629093170166,10603.316078186035,10813.678987503052,929.9770192994843
-10375.43359375,-195.44672966003418,10748.395601272583,10943.842330932617,1368.0293554579323
-10397.0,-183.423246383667,10769.134454727173,10952.55770111084,455.8549049003843
-10069.505859375,-259.73409700393677,10447.063596248627,10706.797693252563,2182.4137197224522
-10374.8955078125,-195.03954315185547,10747.873853683472,10942.913396835327,2441.769013363839
-10384.4580078125,-200.8367042541504,10757.633380889893,10958.470085144043,1301.9611416966186
-9916.423828125,-354.0664792060852,10300.53931093216,10654.605790138245,464.19107590573515
-10115.927734375,-239.14322662353516,10491.74717617035,10730.890402793884,1656.8813502412245
-10362.55859375,-191.39537143707275,10735.31762599945,10926.712997436523,457.0710685594344
-10302.7216796875,-221.71229648590088,10677.625807762146,10899.338104248047,2796.606396869743
-10272.2626953125,-227.05374717712402,10647.53816986084,10874.591917037964,902.4519260485628
-10316.75390625,-233.8970012664795,10692.069610595703,10925.966611862183,1179.0003585321308
-10274.5576171875,-235.90299034118652,10650.211666107178,10886.114656448364,3272.1223056876493
-10373.7783203125,-202.040207862854,10747.337058067322,10949.377265930176,528.0116935414711
-10354.5751953125,-220.65893173217773,10729.190603256226,10949.849534988403,1462.339399003534
-10132.5244140625,-304.7701940536499,10512.574850082397,10817.345044136047,2331.708650543809
-10251.732421875,-256.9559602737427,10628.701272010803,10885.657232284546,491.5246635390671
-10423.0439453125,-208.07607078552246,10796.835209846497,11004.911280632019,1986.6015366736424
-10093.33984375,-271.5007175207138,10471.947628617287,10743.448346138,1794.4191692340817
-10362.7099609375,-210.5242462158203,10736.891916275024,10947.416162490845,1259.1859981472955
-10456.630859375,-205.12564373016357,10830.228713035583,11035.354356765747,422.8552101019937
-10466.9169921875,-198.8701992034912,10840.125560760498,11038.99575996399,937.4390923880966
