loss,margin,positive_reward,negative_reward,deterministic_return
0.0,0.0,0.0,0.0,2.626249569442986
-3669.2734375,1009.0371560677886,4185.602802693844,3176.5656466260552,730.6003066458347
-5148.98876953125,383.31303215026855,5718.54935836792,5335.236326217651,564.9455822170524
-5602.630859375,350.3479223251343,6159.525668144226,5809.177745819092,1152.4100591549832
-5846.859375,352.9585065841675,6396.01504611969,6043.0565395355225,2977.934762331819
-6124.23486328125,359.7966785430908,6664.355257987976,6304.558579444885,1346.5621470277385
-6344.18505859375,378.09997367858887,6876.40284538269,6498.302871704102,962.4009361384198
-6541.9375,378.7224359512329,7070.1896505355835,6691.467214584351,861.062583296779
-6640.1796875,380.2329225540161,7166.432431221008,6786.199508666992,643.4124987689188
-6691.935546875,368.29522037506104,7222.939712524414,6854.644492149353,860.1307287488277
-6916.4765625,394.0917139053345,7436.1964654922485,7042.104751586914,864.6081298821994
-7022.4970703125,391.1356086730957,7542.22511100769,7151.089502334595,1463.8134350794571
-7066.24609375,380.71723461151123,7587.894991874695,7207.177757263184,905.6127575020863
-7211.869140625,385.3436555862427,7729.938395500183,7344.59473991394,900.3850786796614
-7244.755859375,382.5412130355835,7764.194979667664,7381.65376663208,852.3965943221327
-7102.8740234375,334.1327347755432,7640.239779472351,7306.107044696808,1368.2159139150137
-7437.9765625,380.1424570083618,7955.96861743927,7575.826160430908,986.7005475776895
-7387.79296875,358.53070878982544,7913.470862865448,7554.940154075623,1219.5460222455147
-7532.72607421875,373.5765018463135,8051.700306892395,7678.1238050460815,876.4519589584971
-7596.2158203125,366.0277519226074,8116.885751724243,7750.857999801636,888.491144252178
-7683.2470703125,372.05586528778076,8201.181482315063,7829.125617027283,957.2489022954966
-7706.3466796875,364.28089141845703,8226.503699302673,7862.222807884216,949.7420318073005
-7722.9794921875,360.06039810180664,8245.079158782959,7885.018760681152,1404.550920891993
-7689.4951171875,332.4154386520386,8221.281416893005,7888.865978240967,892.3243809997733
-7854.54345703125,356.4557456970215,8374.946455955505,8018.490710258484,1063.3579229489008
-7488.4560546875,264.2498928308487,8045.716679215431,7781.4667863845825,1046.1045166144547
-7990.61083984375,340.7388277053833,8513.1768283844,8172.438000679016,2125.3852890473113
-7805.3154296875,317.89496326446533,8341.679697036743,8023.784733772278,953.1329512025352
-8033.81640625,343.7186155319214,8555.773782730103,8212.055167198181,1012.4515281160508
-8013.7001953125,327.0272822380066,8542.561064243317,8215.53378200531,466.28194386128877
-8038.2548828125,322.2416944503784,8567.826234817505,8245.584540367126,907.0369808833168
-8170.208984375,337.77618408203125,8692.619828224182,8354.84364414215,958.3460544349389
-8069.3017578125,311.3045606613159,8602.691187858582,8291.386627197266,3863.8737151293917
-8282.25,331.04494857788086,8804.136909484863,8473.091960906982,1419.4031325247408
-8096.810546875,315.94582080841064,8630.296451568604,8314.350630760193,1601.615293530049
-8294.126953125,325.54654121398926,8819.18219089508,8493.635649681091,871.082933845196
-8361.2431640625,324.646107673645,8885.568002700806,8560.92189502716,4263.309645129217
-8351.998046875,319.7723903656006,8877.030390739441,8557.25800037384,843.3855687850302
-8300.3134765625,297.4135785102844,8835.63069486618,8538.217116355896,1420.206749941855
-8399.8681640625,310.6560754776001,8928.244571685791,8617.588496208191,866.4077805626782
-8424.9384765625,316.51603984832764,8952.490635871887,8635.97459602356,2056.7437937016925
-8425.86328125,288.1748867034912,8962.057107925415,8673.882221221924,996.6537408468741
-8412.0205078125,310.9762144088745,8941.551203727722,8630.574989318848,925.8159907669096
-8550.388671875,317.2961616516113,9075.460186958313,8758.164025306702,647.5974614668115
-8429.3125,276.37791299819946,8971.073713302612,8694.695800304413,1432.248924552655
-8626.39453125,325.02071380615234,9148.28818321228,8823.267469406128,919.0488128920421
-8400.2099609375,254.09956431388855,8948.300827741623,8694.201263427734,614.2043275930832
-8505.373046875,273.75085830688477,9046.009223937988,8772.258365631104,3552.970554111754
-8576.8759765625,281.57038497924805,9113.797348976135,8832.226963996887,842.0993533115358
-8647.19140625,305.0297317504883,9177.639015197754,8872.609283447266,1978.8959121091414
-8710.8701171875,302.8761672973633,9239.030472755432,8936.154305458069,824.4917238982953
-8605.9970703125,292.3696622848511,9140.443124294281,8848.07346200943,915.4307921996314
-8666.4140625,299.5524673461914,9198.309562683105,8898.757095336914,2577.614210268451
-8652.3935546875,294.2900609970093,9186.182493209839,8891.89243221283,825.1627436558132
-8578.1669921875,256.08603858947754,9124.00972366333,8867.923685073853,901.8076186596508
-8772.6484375,290.95339012145996,9304.945368766785,9013.991978645325,1223.546328703467
-8902.91015625,321.36603450775146,9422.126418113708,9100.760383605957,674.8600299589464
-8831.4326171875,296.7771021127701,9360.464686751366,9063.687584638596,1257.696366471845
-8680.3515625,282.45418643951416,9217.478813171387,8935.024626731873,853.291132957761
-8839.1064453125,300.8899688720703,9366.577363014221,9065.68739414215,5463.805095682179
-8592.4140625,224.2171859741211,9150.773078918457,8926.555892944336,848.2658631229037
-8931.4541015625,311.4509696960449,9456.730108261108,9145.279138565063,3796.654480924503
-8506.572265625,206.2888303771615,9071.743296094239,8865.454465717077,1291.3656397872505
-9057.2255859375,321.4365348815918,9576.202465057373,9254.765930175781,837.7010282514805
-8914.830078125,285.93364334106445,9447.421423912048,9161.487780570984,1354.1137748113356
-8377.658203125,146.76178455352783,8963.332233428955,8816.570448875427,811.8994267209439
-9007.533203125,326.42545318603516,9527.761449813843,9201.335996627808,6154.490238272312
-8960.078125,303.52847385406494,9487.281343460083,9183.752869606018,6007.994802338412
-8908.6162109375,283.4052808880806,9443.434970676899,9160.029689788818,1474.8159883210906
-9176.6494140625,316.6611022949219,9694.860095977783,9378.198993682861,631.393615380063
-9161.130859375,326.5780830383301,9677.291093826294,9350.713010787964,641.1028874025874
-9092.2041015625,298.11658668518066,9617.88446521759,9319.76787853241,1786.8032616764076
-8993.2001953125,280.382688999176,9528.654877185822,9248.272188186646,643.6466518828377
-9228.994140625,330.75074672698975,9744.449136734009,9413.698390007019,1479.0879662884367
-9236.244140625,332.009952545166,9750.88870048523,9418.878747940063,5425.878187382761
-8987.943359375,272.04798698425293,9526.159627914429,9254.111640930176,5015.434399789829
-9139.7724609375,298.5331869125366,9667.245443344116,9368.71225643158,1582.997957878729
-9031.61328125,268.4708490371704,9569.735711097717,9301.264862060547,6760.736445284023
-9197.6982421875,311.5936155319214,9719.98197555542,9408.388360023499,860.6454959895167
-9177.1591796875,297.44858837127686,9703.985311508179,9406.536723136902,2970.80066275685
-9216.7470703125,309.35328674316406,9740.590406417847,9431.237119674683,2165.773538190763
-9007.888671875,266.8220315426588,9546.92002491653,9280.09799337387,959.9133205084113
-9208.83203125,293.7864456176758,9736.633425712585,9442.84698009491,1596.6649934352909
-9150.798828125,302.3740882873535,9679.523509025574,9377.14942073822,6276.059081628086
-9332.3408203125,317.62047386169434,9850.878128051758,9533.257654190063,2710.82111373922
-9292.8740234375,298.6807737350464,9820.078435897827,9521.39766216278,1882.6794155922378
-9023.65234375,216.78801381587982,9578.513266444206,9361.725252628326,1841.8288709882895
-8976.8818359375,244.82043993473053,9526.141981720924,9281.321541786194,1108.7504704009093
-9227.83203125,282.7969036102295,9760.647024154663,9477.850120544434,4369.905596452749
-9354.361328125,304.7709791660309,9879.44137430191,9574.67039513588,3129.225201943698
-9135.5654296875,267.455295085907,9673.51061296463,9406.055317878723,1405.4728404990274
-9326.3427734375,314.54980182647705,9847.365675926208,9532.815874099731,856.1108379926566
-9301.4111328125,298.0582015514374,9827.818506479263,9529.760304927826,909.3398933748574
-9442.67578125,330.88512325286865,9958.871102333069,9627.9859790802,828.507040066571
-9053.974609375,218.90790462493896,9610.678825378418,9391.770920753479,3180.553977704812
-9140.3291015625,262.7211618423462,9683.079526901245,9420.358365058899,6033.900368104986
-9533.994140625,344.2636528015137,10042.29104232788,9698.027389526367,1314.1579099012097
-9038.8388671875,230.38757991790771,9592.27230000496,9361.884720087051,3230.098490417412
-9527.9423828125,334.8734130859375,10040.356686592102,9705.483273506165,2105.8915173412
-9121.4951171875,252.51096715033054,9668.193247929215,9415.682280778885,1253.554276168739
-9064.380859375,213.79389917850494,9622.543377995491,9408.749478816986,3122.1754108758837
-8933.5771484375,153.03881260752678,9516.75088879466,9363.712076187134,3511.219044018927
-9308.544921875,291.7296676635742,9837.296029090881,9545.566361427307,2417.4112038175736
-9254.5869140625,266.9249143600464,9793.45215511322,9526.527240753174,848.9890543718378
-9310.083984375,283.1313066482544,9845.117336273193,9561.986029624939,3989.808502068067
-9228.583984375,253.07469528913498,9773.13605850935,9520.061363220215,2391.490295795988
-9377.7802734375,292.8202408179641,9908.522015415132,9615.701774597168,1798.830315291466
-9076.17578125,202.1544487476349,9637.950404167175,9435.79595541954,2241.216750700937
-9410.6806640625,278.49381589889526,9943.433646678925,9664.93983078003,1128.389857124737
-9541.5458984375,317.8474245071411,10061.177759170532,9743.330334663391,3789.183545274736
-9504.7705078125,319.86754035949707,10023.81071472168,9703.943174362183,1439.8005791485048
-9083.5693359375,135.5031042098999,9665.648917198181,9530.145812988281,1505.2236532279453
-9221.802734375,232.4051730632782,9775.738573789597,9543.333400726318,6392.583663969598
-9465.8056640625,300.88797187805176,9990.496963500977,9689.608991622925,857.0425091027136
-9599.8837890625,319.39699935913086,10117.201906204224,9797.804906845093,3098.7447200691768
-9516.8330078125,303.86850929260254,10041.740048408508,9737.871539115906,1463.7633547436715
-9151.9365234375,158.34365558624268,9727.354962825775,9569.011307239532,2738.074248977676
-9252.4853515625,220.39801859855652,9808.582874536514,9588.184855937958,4580.348078486278
-9576.4736328125,295.7647762298584,10103.110306739807,9807.345530509949,1380.276706013512
-9635.7353515625,319.6136302947998,10154.563239097595,9834.949608802795,1941.3058835817606
-9564.630859375,312.04590702056885,10088.668900966644,9776.622993946075,2401.9246247287515
-9430.931640625,269.88497734069824,9968.629546165466,9698.744568824768,1516.2242416998972
-9692.7099609375,319.4641065597534,10210.328997612,9890.864891052246,883.0509758025208
-8644.697265625,-4.233156859874725,9283.136369526386,9287.369526386261,4062.4817503911745
-9717.810546875,306.8183307647705,10238.195943832397,9931.377613067627,1247.9632203528133
-9505.12890625,277.4965509176254,10038.63110768795,9761.134556770325,2819.835808370265
-9052.7431640625,89.46744322776794,9654.68477511406,9565.217331886292,1395.204439732227
-9716.1181640625,314.5871982574463,10233.679162979126,9919.09196472168,5991.363749127073
-9370.4189453125,260.9049277305603,9911.795469760895,9650.890542030334,4226.164899511895
-9718.646484375,313.0268259048462,10237.810063362122,9924.783237457275,1011.6735350027026
-9692.943359375,331.9111576080322,10207.864103794098,9875.952946186066,3539.2533213803636
-8921.619140625,71.54202842712402,9532.176160812378,9460.634132385254,1043.1154422157274
-9600.5263671875,287.8375678062439,10130.798991680145,9842.961423873901,1389.8749277716317
-9931.732421875,357.3725337982178,10433.673309326172,10076.300775527954,808.6993092369974
-9392.5869140625,237.1896939277649,9941.33254289627,9704.142848968506,1326.4616638085631
-9746.703125,313.0995969772339,10265.884063720703,9952.78446674347,2770.9236528013225
-9272.099609375,198.9444169998169,9835.631249427795,9636.686832427979,1191.9129522146386
-9483.6552734375,227.13249588012695,10034.699385643005,9807.566889762878,5418.838885566422
-9466.1455078125,241.65706157684326,10011.655029296875,9769.997967720032,928.3463998704468
-9313.0576171875,195.24236583709717,9878.357595443726,9683.115229606628,3850.3006238477274
-9706.0322265625,323.82600021362305,10222.661897659302,9898.835897445679,1240.9097587665728
-9540.818359375,277.3928337097168,10077.048429965973,9799.655596256256,2869.0369700245215
-9755.8857421875,296.0157480239868,10280.469939231873,9984.454191207886,1635.7375323592048
-9870.072265625,322.77931690216064,10385.713528633118,10062.934211730957,2092.0266504716656
-9479.6044921875,223.71465289592743,10030.040195345879,9806.325542449951,2289.816248921032
-9768.52734375,304.7618474960327,10290.018417358398,9985.256569862366,3310.54832244154
-9796.439453125,311.5633087158203,10316.864850997925,10005.301542282104,2262.844400328568
-9611.126953125,235.24111461639404,10156.153804779053,9920.912690162659,2104.2506557582838
-9780.328125,299.11489725112915,10304.660339832306,10005.545442581177,1877.8260696960865
-9713.4560546875,279.6285343170166,10244.046695709229,9964.418161392212,1681.180361102153
-9635.7412109375,213.7887887954712,10189.254338264465,9975.465549468994,844.8287013514978
-9464.6435546875,145.99190020561218,10044.242846250534,9898.250946044922,1315.8673867845564
-9526.345703125,193.66004014015198,10085.035108327866,9891.375068187714,1318.6889477466834
-9333.611328125,159.04986321926117,9908.278801321983,9749.228938102722,2688.427334925755
-8598.220703125,-299.79641312360764,9323.773390352726,9623.569803476334,846.6490676291619
-9739.1142578125,285.1331968307495,10268.08620262146,9982.95300579071,3119.87677910299
-9041.798828125,63.69142550230026,9654.61674439907,9590.92531889677,4008.864903181959
-9940.9833984375,329.08476161956787,10454.20219707489,10125.117435455322,3354.888014941827
-9809.6103515625,285.70599937438965,10339.505259513855,10053.799260139465,876.290754918754
-9783.9140625,264.0808210372925,10319.163365364075,10055.082544326782,2294.6549755819547
-9846.638671875,295.93311977386475,10372.08131313324,10076.148193359375,2015.087757982295
-9685.017578125,196.61843967437744,10242.761041641235,10046.142601966858,1026.1345254502917
-9654.3369140625,230.9449224472046,10201.25087928772,9970.305956840515,3514.474070057322
-10022.7041015625,334.3236837387085,10532.328391075134,10198.004707336426,2947.110824947768
-9367.5751953125,123.19404339790344,9956.43747329712,9833.243429899216,938.1663011755961
-9456.681640625,199.8157856464386,10018.113931894302,9818.298146247864,2906.024372578414
-10107.880859375,327.16976737976074,10618.854400634766,10291.684633255005,4147.6259041672465
-9986.705078125,311.22697591781616,10505.878285884857,10194.651309967041,1287.3848103963867
-9841.720703125,261.6803479194641,10378.203564167023,10116.523216247559,4258.012255297353
-9985.830078125,309.4789276123047,10506.590957641602,10197.112030029297,1085.829932735344
-9558.099609375,101.97588348388672,10144.67171573639,10042.695832252502,6709.280306487753
-9804.998046875,272.9123158454895,10339.101150989532,10066.188835144043,6458.632827959224
-9823.896484375,279.7788197994232,10354.568268537521,10074.789448738098,1534.4936477530782
-9661.4326171875,203.1449418067932,10219.36202955246,10016.217087745667,1370.1664567404914
-9706.0400390625,193.95903635025024,10265.273532390594,10071.314496040344,2522.047273021163
-9770.4482421875,248.3296160697937,10313.370884418488,10065.041268348694,6755.161263286878
-9927.466796875,258.8869318962097,10464.55218410492,10205.66525220871,1073.1988355064752
-9535.8251953125,212.4112057685852,10092.978248119354,9880.567042350769,1326.332113188438
-9201.548828125,5.098648428916931,9828.069856524467,9822.97120809555,911.5833688619811
-9270.962890625,85.99709725379944,9872.752714395523,9786.755617141724,1046.2820651685074
-9692.169921875,211.04752206802368,10246.963485240936,10035.915963172913,1553.5789140799288
-10032.08203125,307.9037961959839,10552.488561630249,10244.584765434265,1234.6236776120045
-9854.6611328125,261.21619479358196,10391.812134742737,10130.595939949155,1793.076567876654
-9785.6689453125,194.78129935264587,10346.475317716599,10151.694018363953,1097.3926780229706
-9374.7822265625,102.51809775829315,9968.342154860497,9865.824057102203,6941.704653325877
-10163.8232421875,341.1293239593506,10672.568641662598,10331.439317703247,1164.479177860833
-9250.1123046875,-49.14993979781866,9892.623420454562,9941.77336025238,3167.378820313892
-9980.3447265625,282.99380445480347,10509.47927236557,10226.485467910767,1147.948168340829
-9896.080078125,263.1853151321411,10432.239043235779,10169.053728103638,6665.855158795573
-9743.1044921875,192.68731212615967,10303.1441116333,10110.456799507141,1885.4653515102161
-10104.986328125,291.1165895462036,10630.582733154297,10339.466143608093,1042.5368068988794
-9525.328125,171.9342098236084,10097.757668495178,9925.82345867157,1487.233937589312
-10035.9326171875,284.15080404281616,10564.981215000153,10280.830410957336,1858.0723107571762
-9350.1181640625,95.97916662693024,9948.210044503212,9852.230877876282,6193.553451630088
-9969.923828125,275.67211055755615,10502.479824066162,10226.807713508606,5815.142151591974
-9413.51171875,121.85093677043915,10006.735244870186,9884.884308099747,2435.120052043051
-10253.48046875,313.1906147003174,10769.506954193115,10456.316339492798,4145.395631902122
-9698.064453125,226.22808599472046,10251.446214675903,10025.218128681183,1458.44773779587
-9258.794921875,-2.36419415473938,9887.919171571732,9890.283365726471,2578.0688534306328
-9554.7939453125,127.5792704820633,10149.307314515114,10021.72804403305,2121.8994716946668
-9093.900390625,-161.56281328201294,9772.204561710358,9933.76737499237,6373.355064131716
