loss,margin,positive_reward,negative_reward,deterministic_return
0.0,0.0,0.0,0.0,2.626249569442986
-3514.37841796875,1173.348876670003,4156.5496035814285,2983.2007269114256,864.15121753146
-5004.70751953125,557.6989116668701,5699.655264854431,5141.956353187561,1282.6403963515859
-5461.103515625,527.3924217224121,6132.42234992981,5605.0299282073975,827.633671409171
-5718.802734375,533.8388223648071,6375.183533668518,5841.344711303711,933.1322935625622
-6046.42529296875,530.3964767456055,6690.206878662109,6159.810401916504,980.0622803352774
-6259.7509765625,541.2412967681885,6894.915984153748,6353.674687385559,477.52877016267627
-6434.18115234375,533.1901226043701,7067.454442024231,6534.264319419861,2981.7687977249734
-6566.39794921875,521.1168460845947,7199.767249107361,6678.650403022766,470.5561848724958
-6708.943359375,510.66129302978516,7344.839405059814,6834.178112030029,880.3129614366558
-6843.2421875,522.7232246398926,7471.969372749329,6949.246148109436,973.3552286942779
-6920.5048828125,509.11148166656494,7555.305559158325,7046.19407749176,378.15043332922306
-7017.5791015625,496.68419075012207,7653.727960586548,7157.043769836426,381.3121560015156
-7090.08544921875,493.7837619781494,7725.233995437622,7231.450233459473,893.4843569494693
-7171.0048828125,485.3709135055542,7809.670531272888,7324.299617767334,1484.8321302539043
-7233.88232421875,473.72565269470215,7876.237531661987,7402.511878967285,1149.3906393290877
-7319.4150390625,475.4370365142822,7960.7062339782715,7485.269197463989,984.6815466279877
-7027.46484375,384.1307439804077,7716.897500038147,7332.766756057739,607.0350065782965
-7483.8232421875,461.7225284576416,8124.254364013672,7662.53183555603,1085.7948532984085
-7299.18115234375,442.21347093582153,7956.218990802765,7514.005519866943,5294.095445287976
-7563.099609375,458.22232151031494,8207.407753944397,7749.185432434082,983.7815502426292
-7635.48486328125,454.53276348114014,8278.828450202942,7824.295686721802,931.6550953811256
-7743.2919921875,460.5481309890747,8380.757016181946,7920.208885192871,954.7864418556522
-7792.83203125,456.62889766693115,8431.579442977905,7974.950545310974,805.6399758663983
-7813.3671875,450.1779851913452,8453.805333137512,8003.627347946167,890.6688709699745
-7679.9560546875,413.9325659275055,8342.628867864609,7928.696301937103,1048.830765702875
-7906.02001953125,438.0825147628784,8550.19806098938,8112.1155462265015,956.3444721874433
-7936.2451171875,442.6396417617798,8580.825003623962,8138.185361862183,921.7485652581056
-7901.51220703125,427.45963168144226,8551.667995929718,8124.208364248276,1322.329791540322
-8060.87548828125,438.5719003677368,8703.693084716797,8265.12118434906,980.206724266294
-8084.9140625,441.3022356033325,8725.757399559021,8284.455163955688,1410.8994925149948
-8034.58154296875,424.5633707046509,8686.02008342743,8261.456712722778,401.8360305369796
-8155.744140625,426.49921703338623,8802.156015396118,8375.656798362732,402.603973227617
-8208.4091796875,422.9667625427246,8854.086035728455,8431.11927318573,547.3149551445954
-8216.0185546875,424.953164100647,8862.858857154846,8437.9056930542,6823.402543344813
-8218.05859375,420.7547245025635,8866.104956626892,8445.350232124329,1068.4001409427603
-8042.8046875,362.32276010513306,8723.659356594086,8361.336596488953,411.9078018823257
-7910.7646484375,373.2055621147156,8590.227274894714,8217.021712779999,864.2034284235386
-8271.29296875,412.67618560791016,8925.09814453125,8512.42195892334,815.6942510938742
-8361.53125,410.5712203979492,9010.066520690918,8599.495300292969,620.170252837933
-8365.365234375,410.06640625,9018.09203529358,8608.02562904358,881.6165071697055
-8214.966796875,387.3128162622452,8882.148560166359,8494.835743904114,880.9949078631754
-8505.119140625,420.6164216995239,9146.26976776123,8725.653346061707,865.3334514701158
-8351.654296875,403.05169332027435,9007.887961149216,8604.836267828941,936.7248231680388
-8425.251953125,402.071475982666,9082.80081653595,8680.729340553284,481.34258682676915
-8454.8974609375,402.4561405181885,9110.80550289154,8708.349362373352,843.3045066477043
-8459.7099609375,406.0257730484009,9112.20135974884,8706.17558670044,441.0457324030915
-8571.126953125,415.81510734558105,9215.629354476929,8799.814247131348,486.7826515852056
-8639.4140625,416.06940937042236,9280.82930469513,8864.759895324707,919.9091488328681
-8386.0185546875,372.3617541193962,9059.394511163235,8687.032757043839,5790.929496712363
-8367.626953125,363.4533338546753,9042.949170589447,8679.495836734772,462.5837128145176
-8608.6708984375,399.8766393661499,9260.56566619873,8860.68902683258,933.6506134173324
-8618.37890625,416.68104457855225,9266.56422996521,8849.883185386658,1352.5992746532227
-8300.5078125,330.4955608844757,8997.848667860031,8667.353106975555,400.7530589895481
-8753.357421875,415.37500858306885,9393.710021972656,8978.335013389587,729.2602847811125
-8760.5234375,425.5593032836914,9399.825330734253,8974.266027450562,403.98225508729917
-8600.234375,385.1749292612076,9262.122976064682,8876.948046803474,3062.841787603255
-8506.5859375,384.6877792477608,9170.918729662895,8786.230950415134,859.0452406937698
-8762.607421875,411.67816638946533,9408.641736030579,8996.963569641113,1301.1415709083508
-8817.919921875,414.7502088546753,9459.335004806519,9044.584795951843,1736.2787611468796
-8841.873046875,425.75677967071533,9480.670986175537,9054.914206504822,508.5404838005559
-8553.2138671875,368.07714462280273,9227.594095230103,8859.5169506073,6879.828725574498
-8886.9033203125,418.78225898742676,9525.263228416443,9106.480969429016,655.1309499815595
-8691.1376953125,383.8772747516632,9354.556239366531,8970.678964614868,434.0954039202368
-8925.1845703125,423.21462631225586,9561.775521278381,9138.560894966125,508.4673734037373
-8895.7158203125,405.2307462692261,9540.115416526794,9134.884670257568,408.45747516311843
-8766.087890625,388.75655603408813,9425.779319763184,9037.022763729095,973.4063024435683
-9002.150390625,421.79194259643555,9637.527446746826,9215.73550415039,866.2547852027677
-8891.1708984375,410.7348380088806,9537.742549419403,9127.007711410522,383.54131898823886
-8610.9775390625,328.83918967843056,9301.70078626275,8972.86159658432,1039.8786395572977
-8635.23046875,329.26322746276855,9324.207691192627,8994.944463729858,868.4281068959915
-8928.740234375,407.1805806159973,9575.952029705048,9168.77144908905,834.8757981343452
-8791.09765625,366.8633842468262,9459.726560592651,9092.863176345825,436.6956827960703
-9125.2177734375,440.3696069717407,9753.631233215332,9313.261626243591,1967.1698958389293
-8970.126953125,410.0748338699341,9617.315185546875,9207.240351676941,442.2892881301607
-8967.2353515625,397.44426560401917,9619.117244005203,9221.672978401184,958.4711713940716
-9011.607421875,405.02639961242676,9658.43874835968,9253.412348747253,451.4495590130874
-9122.34375,425.9754819869995,9755.204571723938,9329.229089736938,934.9813733527924
-8633.451171875,310.9917266368866,9335.22876048088,9024.237033843994,598.82581647682
-9151.1357421875,409.308913230896,9791.141710281372,9381.832797050476,915.2787360850705
-8963.8125,385.0273141860962,9624.008870601654,9238.981556415558,454.20380313362966
-9010.8466796875,396.35331869125366,9662.350082874298,9265.996764183044,423.5013329217992
-9149.98046875,413.9875545501709,9789.32989692688,9375.342342376709,457.55751738219664
-9297.533203125,443.95727252960205,9920.519979476929,9476.562706947327,895.291541981769
-9056.1357421875,369.66988945007324,9721.56536102295,9351.895471572876,414.7025735197229
-8894.49609375,319.95665979385376,9585.196269512177,9265.239609718323,424.29444105736076
-8715.26171875,323.37777638435364,9409.586423635483,9086.20864725113,615.9957480171395
-8625.7587890625,212.05909848213196,9372.921648263931,9160.8625497818,436.1866778964252
-9206.78125,411.5896940231323,9848.34395980835,9436.754265785217,493.98481906606554
-8484.7685546875,115.92922079563141,9280.148151278496,9164.218930482864,629.2961622102089
-8986.8330078125,375.232414662838,9653.413489162922,9278.181074500084,1463.3727178092026
-9226.3330078125,419.3465404510498,9864.641655921936,9445.295115470886,1039.3121388150457
-9288.01953125,414.04976511001587,9926.401027202606,9512.35126209259,383.61891273592795
-9071.189453125,371.1807737350464,9736.551104545593,9365.370330810547,1411.4032790412666
-8885.291015625,274.05799436569214,9599.723132610321,9325.665138244629,429.3967776440304
-9292.2626953125,415.7949457168579,9931.880563735962,9516.085618019104,1415.5993557656484
-9298.046875,412.8832893371582,9936.860873222351,9523.977583885193,412.2270846661808
-9253.2431640625,391.94869232177734,9903.844420433044,9511.895728111267,408.4400384757352
-9244.22265625,393.9455337524414,9897.489090919495,9503.543557167053,839.1666037051842
-8987.76171875,320.90266025066376,9677.265532970428,9356.362872719765,1824.2627353525945
-9293.4169921875,398.5760307312012,9939.044553756714,9540.468523025513,486.9216944379579
-9348.7421875,387.58557987213135,10000.54045009613,9612.954870223999,1397.8741563847302
-9146.6640625,343.69538486003876,9823.960786700249,9480.26540184021,907.4670129172888
-9537.2060546875,441.38272857666016,10157.00284576416,9715.6201171875,1182.072119604984
-9366.517578125,401.24039936065674,10010.588949203491,9609.348549842834,442.1544713330103
-9275.05859375,391.6687879562378,9929.869893074036,9538.201105117798,947.9586217962418
-9311.228515625,397.4691524505615,9960.543937683105,9563.074785232544,672.988625173726
-9085.3056640625,348.2910417318344,9762.229642868042,9413.938601136208,465.93848188509816
-8599.537109375,-11.208929538726807,9446.977420330048,9458.186349868774,6884.7689374879865
-9633.2783203125,445.36337089538574,10248.740524291992,9803.377153396606,845.0185291873563
-9154.16796875,349.0947559028864,9831.810807481408,9482.716051578522,1963.9731468955779
-9096.451171875,294.11925172805786,9797.292458057404,9503.173206329346,1021.1824542917249
-9514.724609375,392.8486433029175,10160.740216255188,9767.89157295227,1153.8863047508964
-9406.88671875,410.3525457382202,10047.195000648499,9636.842454910278,792.0231421686486
-9438.033203125,385.93034172058105,10087.324527740479,9701.394186019897,481.25074689526906
-9155.4619140625,310.2621717453003,9849.71185874939,9539.44968700409,927.1038315881078
-9669.9375,429.55033111572266,10292.328705787659,9862.778374671936,857.2199415683498
-9116.3271484375,304.6950731873512,9817.787190675735,9513.092117488384,496.86691477953497
-8780.576171875,178.9755368232727,9545.077342033386,9366.101805210114,817.2171128574117
-9009.7861328125,286.99006575345993,9718.20452928543,9431.214463531971,949.6983064232747
-9534.892578125,377.0529441833496,10189.756778717041,9812.703834533691,628.0754214838759
-9180.119140625,293.4700126647949,9883.837936401367,9590.367923736572,1070.352627519
-9575.76171875,400.24177646636963,10216.376492500305,9816.134716033936,1038.5157883326722
-9169.779296875,231.22868698835373,9898.454721152782,9667.226034164429,6997.571131762759
-9297.0107421875,342.82752352952957,9974.716198265553,9631.888674736023,1133.7229798287901
-9668.3173828125,419.10508728027344,10299.888704299927,9880.783617019653,1385.3691643580914
-9314.490234375,336.4559717178345,9992.35230588913,9655.896334171295,1088.3114696798264
-9109.5263671875,285.6131453514099,9818.597216129303,9532.984070777893,983.4920389431009
-9519.0673828125,353.9197506904602,10184.515278816223,9830.595528125763,1490.3218216710807
-8875.9228515625,96.67063879966736,9674.96831870079,9578.297679901123,5909.009999276281
-9367.291015625,361.5845568180084,10038.445615530014,9676.861058712006,895.9821268813057
-8824.5478515625,177.98484563827515,9594.158296108246,9416.17345046997,904.1071403462688
-9432.029296875,371.6082682609558,10094.264180660248,9722.655912399292,2836.899330851602
-9055.2392578125,151.86524486541748,9824.431010246277,9672.56576538086,1448.1279833318385
-9261.6171875,321.2072911262512,9952.602659702301,9631.39536857605,1164.7255941190238
-9764.56640625,405.6882200241089,10398.798248291016,9993.110028266907,842.1775030713682
-9366.12109375,325.46289443969727,10050.79055261612,9725.327658176422,1515.4191757803508
-9405.6513671875,228.46369528770447,10130.27847456932,9901.814779281616,1002.7431625800962
-9382.3779296875,310.0733003616333,10074.167079925537,9764.093779563904,1477.7779784433258
-8915.306640625,183.15412712097168,9680.518236637115,9497.364109516144,1204.3511138913939
-9862.595703125,434.5434675216675,10484.008700370789,10049.465232849121,1445.0635647366262
-9723.6904296875,377.468563079834,10374.170545578003,9996.701982498169,1283.0119270879202
-8998.2158203125,75.96412217617035,9805.689927458763,9729.725805282593,851.5617333982073
-9124.8369140625,253.50187921524048,9849.028562545776,9595.526683330536,2279.7098511556196
-8780.91015625,28.234401404857635,9627.639925658703,9599.405524253845,1243.0745904348114
-7362.46826171875,-843.4098992347717,8605.35907125473,9448.768970489502,431.7188014589729
-9020.5087890625,91.47743320465088,9814.765615463257,9723.288182258606,500.02242812691946
-9511.2373046875,372.8794560432434,10172.145854473114,9799.26639842987,950.4539869730941
-9584.8544921875,345.4987587928772,10254.847980976105,9909.349222183228,1802.6490674960291
-9832.5849609375,403.8396825790405,10468.263307571411,10064.42362499237,1488.4197998232878
-8180.00732421875,-383.062283039093,9209.784962177277,9592.84724521637,1916.2890691510668
-9680.5625,334.6431760787964,10346.94786643982,10012.304690361023,2051.3214044092497
-9222.208984375,237.7263657450676,9950.337869942188,9712.61150419712,1110.837748150373
-9526.24609375,359.78507232666016,10192.906100273132,9833.121027946472,1524.7139231976128
-9559.041015625,324.26000595092773,10241.092887878418,9916.83288192749,950.1459314401263
-10027.4873046875,441.5901403427124,10641.682871818542,10200.09273147583,903.6633733163349
-9538.1591796875,334.0688488483429,10217.433398246765,9883.364549398422,995.7534268503085
-8251.9501953125,-216.9423553943634,9215.961534261703,9432.903889656067,2033.4609880078285
-9548.333984375,342.89699935913086,10224.107414245605,9881.210414886475,1926.1191349265328
-9151.0048828125,167.5578417778015,9924.20379447937,9756.645952701569,868.8904138269378
-9063.82421875,162.68135166168213,9825.440154075623,9662.75880241394,948.1580797814325
-9010.6572265625,195.92169857025146,9770.934924960136,9575.013226389885,1475.3989786407535
-8988.5234375,141.45279669761658,9770.366725206375,9628.913928508759,807.5349952463407
-9447.876953125,280.16087436676025,10149.752313613892,9869.591439247131,1571.2422723378077
-9650.041015625,317.0290832519531,10330.915817260742,10013.886734008789,1197.9912824053506
-9212.9775390625,198.86650466918945,9966.353721618652,9767.487216949463,893.4382462114626
-9913.04296875,406.58903408050537,10552.791487693787,10146.202453613281,1010.1836551026732
-8159.3818359375,-164.51662802696228,9129.143725633621,9293.660353660583,1038.739609839932
-7309.796875,-706.1974506378174,8501.581976890564,9207.779427528381,1354.340315051803
-9320.37109375,194.81235885620117,10067.681129455566,9872.868770599365,877.9209619947321
-9425.44921875,323.5424742400646,10113.970385998487,9790.427911758423,5615.862393703345
-9760.1279296875,373.7666301727295,10415.836735248566,10042.070105075836,907.6234017358405
-9791.033203125,333.9747920036316,10463.21389055252,10129.23909854889,1316.4066339815538
-7484.36865234375,-597.0676302909851,8650.372540712357,9247.440171003342,517.2183409474738
-8009.57568359375,-647.9111099243164,9153.906931877136,9801.818041801453,1035.8411209575165
-9330.6181640625,227.78399085998535,10061.675108909607,9833.891118049622,2397.4245480966215
-9870.458984375,387.5719003677368,10512.585457801819,10125.013557434082,1325.5878200472916
-9857.376953125,367.66441917419434,10512.155032634735,10144.49061346054,1593.9738983278228
-9151.732421875,136.96469020843506,9933.97331237793,9797.008622169495,669.4930295614686
-9431.0703125,213.97745943069458,10170.508999347687,9956.531539916992,1101.5497756500295
-9219.228515625,88.5146427154541,10023.243341445923,9934.728698730469,972.991227302835
-9473.380859375,174.53178477287292,10222.797896146774,10048.266111373901,1002.2056351099335
-9662.736328125,275.05346870422363,10361.844386100769,10086.790917396545,999.1167667456124
-9687.11328125,301.5385015010834,10379.172425031662,10077.633923530579,1043.1332184969706
-8445.0654296875,-167.61688697338104,9385.945615887642,9553.562502861023,856.7596326470332
-9687.6923828125,305.23495149612427,10382.683412075043,10077.448460578918,898.3297932685791
-9753.056640625,353.971941947937,10417.524463653564,10063.552521705627,1290.05616014202
-9160.4873046875,82.09521383047104,9975.094040334225,9892.998826503754,888.6165015831288
-8141.94189453125,-282.860910654068,9145.647636175156,9428.508546829224,960.0124450371586
-8183.47314453125,-274.4871747493744,9183.607273817062,9458.094448566437,1269.707218688615
-8647.0771484375,-114.52603197097778,9550.087843894958,9664.613875865936,986.547635374011
-9521.4599609375,274.2437515258789,10232.693858146667,9958.450106620789,1162.1829430331347
-9441.943359375,157.36542415618896,10202.09173488617,10044.72631072998,1045.4036380848627
-7522.06103515625,-539.9211673736572,8674.369870185852,9214.29103755951,1070.8109590210995
-8067.76318359375,-640.0334024429321,9204.899626731873,9844.933029174805,5027.564242342113
-9316.345703125,71.44335448741913,10122.074783205986,10050.631428718567,341.23294573796727
-7845.5546875,-424.2024784088135,8901.812933921814,9326.015412330627,919.8917424171427
-9373.736328125,152.34395790100098,10145.528646469116,9993.184688568115,596.4729319329793
-8253.337890625,-357.34210109710693,9286.707398414612,9644.049499511719,1722.818726804475
-9625.1455078125,209.02129936218262,10355.78542804718,10146.764128684998,512.8813995462574
-8696.6591796875,-31.592583656311035,9575.120850086212,9606.713433742523,1178.6933391374203
