loss,margin,positive_reward,negative_reward,deterministic_return
0.0,0.0,0.0,0.0,6.460298400576367
-4010.5693359375,845.6584406988695,4394.246755917557,3548.588315218687,417.3668317757262
-5478.9091796875,187.61309909820557,5910.209952354431,5722.596853256226,1625.2912950333427
-5858.3671875,142.41172122955322,6291.27799987793,6148.8662786483765,1187.6135419316408
-6177.20849609375,109.52699565887451,6611.610248565674,6502.083252906799,2150.1371697488394
-6422.18994140625,105.00753116607666,6855.227313041687,6750.21978187561,1077.3817381397246
-6550.5029296875,108.17246913909912,6982.881105422974,6874.7086362838745,575.9775874872443
-6731.06298828125,109.09636306762695,7162.505317687988,7053.408954620361,1321.548033283662
-6852.15087890625,96.68016052246094,7285.546325683594,7188.866165161133,581.2239015001225
-6998.5849609375,98.11749744415283,7430.092923164368,7331.975425720215,585.6259828915431
-7060.14501953125,92.17703437805176,7492.649487495422,7400.472453117371,2275.098505307403
-7203.2080078125,102.82172966003418,7633.375316619873,7530.553586959839,1272.7114594392272
-7224.865234375,95.47877025604248,7657.169890403748,7561.691120147705,1106.8055808551971
-7354.9794921875,100.5695571899414,7786.009150505066,7685.4395933151245,647.8199333844319
-7435.0263671875,97.47560119628906,7865.720383644104,7768.244782447815,1344.6548117195366
-7458.21923828125,90.55140209197998,7889.618779182434,7799.067377090454,845.9657626989361
-7553.20654296875,90.80238342285156,7984.64098072052,7893.8385972976685,904.9926700378621
-7560.5439453125,82.73159885406494,7993.440967559814,7910.7093687057495,1253.4082392806836
-7448.61962890625,47.271087646484375,7888.75044965744,7841.479362010956,876.0786892616755
-7657.1015625,93.35712909698486,8087.477189064026,7994.120059967041,2417.508370939237
-7746.66015625,75.91407775878906,8178.574507713318,8102.660429954529,839.4402442743275
-7776.337890625,77.85047245025635,8208.8486328125,8130.998160362244,1027.4975939154504
-7687.77978515625,46.12740683555603,8125.770799398422,8079.643392562866,2712.43879429678
-7839.5966796875,89.74020671844482,8269.776231765747,8180.036025047302,997.6116376603351
-7884.27294921875,78.02910804748535,8316.36801815033,8238.338910102844,1025.552293429725
-7937.78125,81.20319271087646,8368.860555648804,8287.657362937927,862.7663191003229
-8013.84423828125,74.66765308380127,8445.234398841858,8370.566745758057,864.3792936878998
-7906.2431640625,54.2658896446228,8342.218250751495,8287.952361106873,1849.8013907940401
-8051.7734375,83.78284168243408,8481.852838516235,8398.069996833801,1721.9109740584424
-8083.6630859375,66.70416069030762,8515.412887573242,8448.708726882935,1194.0462316348119
-8051.39599609375,64.90233707427979,8484.905086517334,8420.002749443054,1052.1406828801194
-7941.77001953125,45.54175519943237,8379.56087398529,8334.019118785858,994.1256932129668
-8199.8623046875,70.66773509979248,8631.190442085266,8560.522706985474,911.6949666916634
-8101.912109375,51.194507122039795,8537.511532306671,8486.317025184631,2464.968048433694
-8132.07177734375,42.764174938201904,8568.969175815582,8526.20500087738,875.1902298277915
-8278.486328125,76.88850593566895,8708.39864730835,8631.51014137268,2667.1576388126805
-8215.681640625,53.725565910339355,8650.412524223328,8596.686958312988,1007.4010307766686
-8283.0400390625,65.04393863677979,8715.1169090271,8650.07297039032,960.8659074188697
-8267.6162109375,47.298593521118164,8702.985586166382,8655.686992645264,1064.662587711428
-8378.232421875,61.71088409423828,8809.676038742065,8747.965154647827,1549.3759258588161
-8329.33984375,56.063082695007324,8763.03030014038,8706.967217445374,2418.003542038407
-8345.099609375,59.740623474121094,8778.147477149963,8718.406853675842,892.7487832323321
-8463.6220703125,59.767319679260254,8895.422596931458,8835.655277252197,1435.4268185972373
-8385.70703125,53.683226585388184,8819.585746765137,8765.902520179749,1096.0161694945186
-8500.384765625,55.07706546783447,8932.872016906738,8877.794951438904,2386.4537078398675
-8446.2216796875,46.41763114929199,8880.610747337341,8834.19311618805,2023.0232197515634
-8489.4931640625,46.01797389984131,8922.910663604736,8876.892689704895,2818.211558595231
-8500.5478515625,60.6785831451416,8933.058097839355,8872.379514694214,1931.3190921694165
-8557.24609375,49.2726354598999,8989.985333442688,8940.712697982788,3565.416300162022
-8585.6015625,56.4730224609375,9017.538133621216,8961.065111160278,2125.55121953559
-8652.5712890625,59.92919921875,9083.095077514648,9023.165878295898,1718.6995970648695
-8411.4853515625,4.506310939788818,8853.196218967438,8848.689908027649,1051.7783791796453
-8626.6171875,53.165764808654785,9058.675746917725,9005.50998210907,1829.7252923816384
-8434.880859375,25.274643898010254,8874.005679130554,8848.731035232544,1710.0272167339435
-8676.14453125,47.582895278930664,9109.398320198059,9061.815424919128,1002.6978747282585
-8534.0849609375,17.939079761505127,8972.660321235657,8954.721241474152,973.1322250891645
-8714.1279296875,56.07024669647217,9145.85338306427,9089.783136367798,1100.9339971829618
-8651.6865234375,45.24332904815674,9085.588701248169,9040.345372200012,1909.658304362362
-8745.533203125,57.14090824127197,9176.456089019775,9119.315180778503,2634.2547984563375
-8770.498046875,54.83945846557617,9201.983446121216,9147.14398765564,3439.2353327606247
-8795.6455078125,55.10046672821045,9227.05230998993,9171.951843261719,1014.1091497409446
-8664.248046875,9.261682152748108,9104.038830399513,9094.777148246765,4209.270306839045
-8783.90625,40.37242603302002,9217.504976272583,9177.132550239563,4439.749864247508
-8391.494140625,-62.251410365104675,8845.100331902504,8907.351742267609,1555.4118607529633
-8824.916015625,56.38662528991699,9256.225555419922,9199.838930130005,1373.7134875769968
-8906.7119140625,51.06348705291748,9338.12694644928,9287.063459396362,1042.6486104693902
-8888.064453125,49.81363105773926,9319.9723072052,9270.158676147461,1002.8984267108075
-8879.0263671875,39.17004585266113,9312.454916000366,9273.284870147705,2192.6612842273034
-8902.8505859375,46.33918476104736,9334.983701705933,9288.644516944885,1372.2837506039648
-8963.92578125,46.84591007232666,9395.734246253967,9348.88833618164,919.0890599553601
-8873.0263671875,21.963783264160156,9309.126693725586,9287.162910461426,2280.7584627858005
-8960.5224609375,34.224674224853516,9393.891542434692,9359.666868209839,3023.85758908626
-8914.3603515625,21.702457427978516,9350.677313804626,9328.974856376648,1641.2035749504007
-9014.361328125,36.12852668762207,9447.044891357422,9410.9163646698,2004.6390811540768
-8942.3544921875,24.980080604553223,9377.696284294128,9352.716203689575,4203.433122461916
-8985.8486328125,25.451361656188965,9421.143586158752,9395.692224502563,2522.997566098034
-9018.8701171875,28.086170196533203,9453.094198226929,9425.008028030396,1151.745314906298
-9092.8603515625,40.899033546447754,9524.519865989685,9483.620832443237,1571.8929792116166
-8632.08984375,-102.82421922683716,9090.472694396973,9193.29691362381,1418.3713571247215
-9084.8603515625,31.158846855163574,9518.367001533508,9487.208154678345,1785.4837073906576
-8923.4609375,3.922759771347046,9363.465039014816,9359.54227924347,1036.7079219953196
-9110.5595703125,24.593913078308105,9545.624731063843,9521.030817985535,1066.2829965557155
-9050.2744140625,26.55527687072754,9485.201780319214,9458.646503448486,1064.7838909758852
-9110.9130859375,29.488539695739746,9545.223029136658,9515.734489440918,1955.3354244381512
-9014.890625,-1.4666633605957031,9455.035038948059,9456.501702308655,1215.4872128923982
-9167.642578125,36.13840198516846,9600.584949493408,9564.44654750824,1610.5449502396564
-8936.9541015625,-19.93076229095459,9380.819731712341,9400.750494003296,1916.6197176890928
-9227.28515625,30.454622268676758,9660.102180480957,9629.64755821228,1064.4465716930174
-9131.1357421875,8.469141006469727,9568.279742240906,9559.810601234436,1605.91020322576
-9064.32421875,-16.99587059020996,9506.957980155945,9523.953850746155,2377.986203382629
-9000.0751953125,-5.451986312866211,9440.72477054596,9446.176756858826,921.7294765853358
-9209.05078125,17.186108589172363,9644.522185325623,9627.33607673645,872.1030536795474
-9244.1484375,31.01807403564453,9677.270637512207,9646.252563476562,1928.4690601615778
-9130.541015625,13.059702023863792,9567.489753589034,9554.43005156517,4386.484650933082
-9290.6103515625,34.56532001495361,9723.035634040833,9688.470314025879,1659.316086239818
-9127.07421875,1.335759162902832,9566.172198295593,9564.83643913269,3611.1255596124697
-9251.3125,20.06658363342285,9686.425377845764,9666.358794212341,3324.55387988912
-9338.4208984375,33.37393760681152,9770.427137374878,9737.053199768066,1767.748228077212
-9238.15234375,18.9062442779541,9673.721155166626,9654.814910888672,2236.3571066517493
-9010.1142578125,-54.770968437194824,9460.056404590607,9514.827373027802,1139.139033843427
-9165.50390625,-4.3385796546936035,9604.415001392365,9608.753581047058,803.2853788311335
-9339.6455078125,28.06082820892334,9773.157719612122,9745.096891403198,970.3820686801017
-9401.0380859375,38.6323184967041,9832.055213928223,9793.422895431519,1385.6376956323181
-9102.55859375,-39.97260570526123,9548.37754535675,9588.350151062012,857.4960865553568
-9374.353515625,29.551575660705566,9807.097304344177,9777.545728683472,1518.6040116311688
-9322.568359375,1.304804801940918,9760.382571220398,9759.077766418457,4124.293880465313
-9303.04296875,-1.1210412979125977,9740.97473526001,9742.095776557922,834.0316514291771
-9264.9619140625,-6.3870744705200195,9705.188526153564,9711.575600624084,1716.2286124162722
-9293.58984375,-4.920519828796387,9732.953272819519,9737.873792648315,1225.0270576262772
-9251.330078125,-6.8115363121032715,9691.079057216644,9697.890593528748,797.4912746394677
-9387.904296875,21.274751663208008,9822.49862575531,9801.223874092102,3542.4345183428723
-9308.41796875,-16.318615913391113,9749.270364761353,9765.588980674744,1182.393307202262
-9381.45703125,9.352595329284668,9818.386458396912,9809.033863067627,2169.5589820666733
-9459.5908203125,25.12649917602539,9892.958902359009,9867.832403182983,2947.9312930294736
-9318.8935546875,-2.6212892532348633,9757.512924194336,9760.13421344757,1545.876059103657
-9002.3232421875,-183.50729703903198,9471.081775188446,9654.589072227478,855.4832623034139
-9329.8037109375,-3.4733896255493164,9768.904502868652,9772.377892494202,875.9019385957523
-9489.7890625,23.884384155273438,9923.977993011475,9900.093608856201,2675.8575178311708
-9401.0810546875,-12.151808738708496,9840.521537780762,9852.67334651947,2730.8418942042344
-9500.8359375,22.612412452697754,9934.46988773346,9911.857475280762,1061.930877046096
-9487.4111328125,12.184454917907715,9923.071782112122,9910.887327194214,888.5336895091459
-9251.6103515625,-50.32317781448364,9699.176953792572,9749.500131607056,1412.6672421768146
-9554.537109375,32.492069244384766,9987.079169273376,9954.587100028992,647.7980482024634
-9308.03515625,-55.64995193481445,9755.650228500366,9811.30018043518,3542.900458370454
-9363.0986328125,-39.926618576049805,9808.27557849884,9848.20219707489,626.5993698529074
-9562.271484375,29.745823860168457,9994.881929397583,9965.136105537415,1129.5759245541417
-9522.66015625,7.883903980255127,9959.113139629364,9951.229235649109,1299.738647685267
-9530.5947265625,-3.225883960723877,9967.878200054169,9971.104084014893,1183.0666884469113
-9488.748046875,-8.153302669525146,9927.572162151337,9935.725464820862,1502.9100156488628
-9637.5283203125,28.26383399963379,10069.878432273865,10041.614598274231,5264.7300908925245
-9405.310546875,-18.719830989837646,9847.42898607254,9866.148817062378,998.195978902944
-9525.056640625,7.618948936462402,9962.0804605484,9954.461511611938,1065.6254892090585
-9590.3515625,9.367332458496094,10026.220513343811,10016.853180885315,1001.5056670445023
-9239.005859375,-125.20546579360962,9698.871755123138,9824.077220916748,1740.3825197968201
-9401.6826171875,-25.33860492706299,9843.99523639679,9869.333841323853,821.9285828060861
-9506.92578125,-25.586556434631348,9948.657215118408,9974.24377155304,3137.4441259064424
-9638.533203125,19.978781700134277,10072.639597892761,10052.660816192627,2100.09315545027
-9652.923828125,20.159597396850586,10086.677230834961,10066.51763343811,2178.1937536236514
-9640.4765625,4.915700912475586,10076.159679412842,10071.243978500366,3382.583911620377
-9516.6728515625,-52.74482440948486,9962.116396903992,10014.861221313477,4376.368142787875
-9406.88671875,-48.30573272705078,9852.894229888916,9901.199962615967,1573.7341853836213
-9713.7568359375,22.95114231109619,10146.92610836029,10123.974966049194,887.8635588425232
-9581.0,-17.551486015319824,10021.727993011475,10039.279479026794,1149.2574268208639
-9685.064453125,6.32520866394043,10121.060552597046,10114.735343933105,5034.242440418153
-9573.48828125,-27.80011558532715,10015.506223678589,10043.306339263916,1099.3237457492548
-9338.580078125,-107.84285020828247,9794.369065761566,9902.211915969849,1292.068768943892
-9700.7587890625,4.526921272277832,10137.054871559143,10132.527950286865,1450.6561245409769
-9762.69140625,15.870904922485352,10196.692474365234,10180.821569442749,1661.4694337195979
-9728.435546875,13.484184265136719,10163.272599220276,10149.78841495514,1476.4534853726038
-9562.02734375,-18.770965099334717,10003.23742055893,10022.008385658264,3538.2952432134457
-9338.5126953125,-115.70360517501831,9795.655646800995,9911.359251976013,869.4406287700233
-9831.3134765625,23.72282886505127,10263.618767738342,10239.895938873291,2185.494601343989
-9279.0185546875,-136.60489177703857,9740.585566520691,9877.19045829773,555.3115615776343
-9683.490234375,-5.631714344024658,10121.734212398529,10127.365926742554,1531.8288561806958
-9340.5595703125,-145.69305419921875,9802.566638946533,9948.259693145752,691.3199862745784
-9844.13671875,34.57664489746094,10275.287244796753,10240.710599899292,2295.8640900273876
-9727.447265625,-3.44449520111084,10165.168329238892,10168.612824440002,1153.9868176154343
-9699.58203125,-19.35520029067993,10140.326038837433,10159.681239128113,1886.1451874053414
-9710.521484375,-23.901968002319336,10151.252449035645,10175.154417037964,1055.6634635538528
-9353.8525390625,-99.56438505649567,9809.62651336193,9909.190898418427,1045.6450021743915
-9872.8056640625,20.31014633178711,10305.647985458374,10285.337839126587,2554.1138642351657
-9714.4580078125,-38.41932487487793,10157.024900436401,10195.44422531128,1459.023825449933
-9756.0849609375,-32.504852294921875,10197.698974609375,10230.203826904297,3249.4917118896533
-9504.5087890625,-146.31304049491882,9965.194653749466,10111.507694244385,2528.268441304896
-9662.6240234375,-33.53652763366699,10106.041282653809,10139.577810287476,1834.652711449386
-9712.45703125,-21.55058217048645,10152.512099027634,10174.06268119812,766.778581204639
-9699.087890625,-27.75319242477417,10141.145726680756,10168.89891910553,1155.88904930694
-9512.662109375,-103.75529599189758,9967.730686903,10071.485982894897,1672.951439537208
-9863.3681640625,-10.476228713989258,10301.373699188232,10311.849927902222,1043.4907146090798
-9804.546875,-27.17148494720459,10245.034657478333,10272.206142425537,763.2047842122959
-9810.1982421875,-29.457777976989746,10252.054162979126,10281.511940956116,1158.437783208729
-9333.6064453125,-166.68152123689651,9800.72113865614,9967.402659893036,1239.424989058409
-9856.435546875,-20.822620391845703,10296.332263946533,10317.154884338379,1010.9032188892327
-9806.5732421875,-18.915459632873535,10245.877397537231,10264.792857170105,1129.2728910453209
-9345.134765625,-212.12805080413818,9818.35814666748,10030.486197471619,2476.758504647923
-9674.5244140625,-59.43940448760986,10121.12049293518,10180.55989742279,908.9131789711305
-9754.376953125,-44.58864879608154,10198.459022521973,10243.047671318054,856.8431082671941
-9993.1220703125,16.937564849853516,10426.066654205322,10409.129089355469,1631.7604020737158
-9792.9580078125,-59.540045738220215,10238.878973960876,10298.419019699097,1513.5646673421243
-9822.236328125,-23.74983310699463,10262.927346229553,10286.677179336548,795.7620587488279
-10019.146484375,11.360001564025879,10452.986085891724,10441.626084327698,1776.474319566221
-9345.5908203125,-169.1465718448162,9812.681623727083,9981.8281955719,789.4322773697855
-9844.2578125,-41.59786558151245,10287.661492824554,10329.259358406067,1224.6821571208934
-9965.0,5.739548683166504,10400.634175300598,10394.894626617432,3277.0245679897835
-9486.8193359375,-175.70170402526855,9952.741409301758,10128.443113327026,587.4443331409001
-9902.5732421875,-17.589468955993652,10342.493516921997,10360.08298587799,3655.8574434802
-9475.5302734375,-109.15480750799179,9933.060469448566,10042.215276956558,1288.390855151284
-9159.7451171875,-437.8952579498291,9667.917481422424,10105.812739372253,723.1301934051465
-9867.9873046875,-29.224661827087402,10309.774517059326,10338.999178886414,669.3427127959726
-9808.90625,-59.682820320129395,10255.475187301636,10315.158007621765,1627.3552335187553
-10097.8349609375,18.08184051513672,10530.228723526001,10512.146883010864,1554.7925182489037
-9177.0615234375,-337.14352440834045,9672.268360853195,10009.411885261536,2529.9572331022246
-8895.181640625,-427.3500952720642,9406.345016479492,9833.695111751556,780.6109961827796
-9909.1806640625,-54.749948501586914,10354.71642112732,10409.466369628906,1117.8761939273406
-9923.974609375,-7.574643135070801,10362.761669158936,10370.336312294006,919.3703874469926
-9907.125,-31.076621532440186,10348.746656894684,10379.823278427124,3003.2529837182165
-9771.595703125,-72.50288820266724,10220.849169254303,10293.35205745697,1357.0905295132743
-9870.048828125,-63.718804359436035,10316.804655075073,10380.52345943451,2362.0472765455384
-9613.2470703125,-121.05451899766922,10071.467122495174,10192.521641492844,1292.5855030624978
-9566.98046875,-288.2667908668518,10049.968645572662,10338.235436439514,1306.6606273105208
-9770.3515625,-105.9583044052124,10224.419191360474,10330.377495765686,1202.554818161459
