loss,margin,positive_reward,negative_reward,deterministic_return
0.0,0.0,0.0,0.0,-0.3847263093484723
290.31842041015625,755.2514614351094,1176.1156285479665,420.8641671128571,58.58402124561677
305.0264587402344,609.8675178289413,1919.2490029335022,1309.3814851045609,846.4126560779785
308.5067443847656,576.6074769496918,2096.0101838111877,1519.402706861496,4960.386085580596
310.3863220214844,556.1327993869781,2176.479686498642,1620.3468871116638,2191.820324888269
310.86676025390625,551.6884245872498,2231.425772666931,1679.7373480796814,5019.974432181573
311.6833801269531,539.6398289203644,2269.9826827049255,1730.3428537845612,4926.489174851554
312.309814453125,532.1601016521454,2305.395754337311,1773.2356526851654,4888.14451493058
312.3453369140625,533.2592406272888,2331.3960843086243,1798.1368436813354,5064.658172732765
312.7671813964844,524.8416080474854,2355.3041315078735,1830.4625234603882,4978.706204165483
312.7822570800781,526.2237815856934,2380.072705745697,1853.8489241600037,4969.991116671614
312.85980224609375,526.5008471012115,2391.718147754669,1865.2173006534576,4988.315398969933
313.34259033203125,519.6928491592407,2405.5239582061768,1885.831109046936,594.3237058196547
313.1264953613281,522.6611695289612,2415.9971532821655,1893.3359837532043,4944.328651082818
313.2120666503906,520.9229907989502,2431.973762512207,1911.0507717132568,4991.314759411113
313.4676208496094,519.8573749065399,2445.500579357147,1925.6432044506073,4950.7679144906515
313.55633544921875,518.1929094791412,2453.212022304535,1935.0191128253937,5067.108008259089
313.4525146484375,518.4500889778137,2464.7770133018494,1946.3269243240356,4922.861674846165
313.6195983886719,517.9713370800018,2471.715292930603,1953.7439558506012,4994.925412783215
313.92767333984375,513.6481251716614,2475.41975069046,1961.7716255187988,4988.67381345643
313.7992248535156,516.8726289272308,2484.4404258728027,1967.567796945572,4979.551951411912
313.5852966308594,517.8823683261871,2488.4985494613647,1970.6161811351776,4960.584425120236
313.8570556640625,514.7487847805023,2494.1840138435364,1979.435229063034,4937.0094653325295
314.3115539550781,509.910049200058,2500.005793571472,1990.0957443714142,4968.697481712354
313.8222961425781,512.708753824234,2508.969666004181,1996.260912179947,4943.991218933596
314.1594543457031,511.93964529037476,2503.4188175201416,1991.4791722297668,4967.844699407874
313.8259582519531,515.8067195415497,2514.741708755493,1998.9349892139435,4965.959646819969
314.26953125,509.66813468933105,2516.443672657013,2006.7755379676819,4963.556758649018
314.35223388671875,507.41234588623047,2515.27489566803,2007.8625497817993,4983.705202111802
314.3595886230469,509.2939977645874,2523.4885120391846,2014.1945142745972,5028.336461642005
314.4352111816406,506.54715609550476,2534.5765976905823,2028.0294415950775,4953.622602260428
314.57989501953125,505.6220471858978,2528.835148334503,2023.2131011486053,4981.456725627877
314.1388854980469,511.32715797424316,2544.6563811302185,2033.3292231559753,4984.835363190761
314.5279541015625,505.91778230667114,2532.9603786468506,2027.0425963401794,4970.239823530358
314.259521484375,510.5893039703369,2542.410966396332,2031.8216624259949,4975.788798765808
314.4473571777344,507.1074757575989,2550.0419821739197,2042.9345064163208,4927.078809156498
314.27801513671875,509.48835825920105,2554.1321659088135,2044.6438076496124,1068.9952730887774
314.6165771484375,505.62957215309143,2547.3683195114136,2041.7387473583221,4983.200801768174
314.3383483886719,508.19328117370605,2549.1810507774353,2040.9877696037292,4999.867188066417
314.5843505859375,505.25165033340454,2560.994836330414,2055.7431859970093,4974.145645850239
314.5664367675781,506.8675994873047,2559.3002185821533,2052.4326190948486,4960.459935289467
314.6281433105469,503.917866230011,2563.2852811813354,2059.3674149513245,4882.598129777787
314.8697204589844,501.0615134239197,2567.632474422455,2066.570960998535,4982.469419720138
314.6964111328125,503.1027936935425,2573.6055674552917,2070.5027737617493,4998.783293007758
314.50640869140625,506.78616547584534,2573.331886768341,2066.5457212924957,5015.628616835271
314.76025390625,503.0089042186737,2569.463583469391,2066.454679250717,4949.814322077574
314.38043212890625,508.1424882411957,2569.141818523407,2060.9993302822113,5020.520254871816
314.70263671875,504.3340759277344,2566.7583270072937,2062.4242510795593,4950.828860103948
314.6553955078125,504.71276903152466,2569.9972462654114,2065.2844772338867,5007.377184169626
314.8279724121094,502.11533522605896,2567.598002910614,2065.482667684555,5017.778186430206
314.9073181152344,502.0251111984253,2578.6491389274597,2076.6240277290344,4988.304248408717
314.7729797363281,503.8007686138153,2580.171407699585,2076.3706390857697,4974.926518702122
314.6810607910156,504.6789903640747,2587.9123063087463,2083.2333159446716,4992.017815508097
314.8950500488281,501.11499857902527,2585.4381713867188,2084.3231728076935,4946.013794445669
314.84136962890625,502.7755124568939,2582.9716992378235,2080.1961867809296,4949.39793886086
314.7361755371094,504.165869474411,2593.897148132324,2089.731278657913,4965.119197938036
314.6263122558594,504.73530101776123,2586.606900215149,2081.8715991973877,4940.045329001188
314.92828369140625,500.44035053253174,2585.840799808502,2085.4004492759705,4940.35858841987
314.8440246582031,502.3783481121063,2589.991683483124,2087.6133353710175,4984.761832608092
314.5733642578125,505.5458827018738,2590.5775809288025,2085.0316982269287,4948.159662139942
315.0641174316406,498.4527950286865,2590.4413418769836,2091.988546848297,4949.9463853313655
314.6474304199219,504.3144495487213,2587.883948326111,2083.5694987773895,1075.8499663327138
314.8232116699219,500.7355885505676,2590.608829975128,2089.8732414245605,4932.855930407297
314.9725036621094,499.8406038284302,2590.7617707252502,2090.92116689682,4931.968209745871
315.159423828125,499.0435447692871,2595.3941774368286,2096.3506326675415,4958.30203854506
314.6328430175781,504.8309361934662,2590.27281665802,2085.441880464554,4985.801049251669
315.21636962890625,497.08137607574463,2595.277590751648,2098.1962146759033,4947.943673450088
314.8823547363281,500.00756645202637,2593.4975056648254,2093.489939212799,4943.421333051016
314.73016357421875,504.4502215385437,2590.8005352020264,2086.3503136634827,4969.178737519854
315.0654602050781,498.82337975502014,2605.7594122886658,2106.9360325336456,4997.797243679112
314.7092590332031,503.6280195713043,2608.497887134552,2104.8698675632477,4983.782733080077
315.0798034667969,497.4778468608856,2611.6355028152466,2114.157655954361,4974.95835447719
315.1743469238281,498.06279730796814,2597.4795637130737,2099.4167664051056,4983.9842158029915
314.498291015625,507.2613205909729,2605.970326900482,2098.7090063095093,5002.377496580887
315.0260925292969,499.78140115737915,2603.9800477027893,2104.19864654541,4964.550523829745
314.89154052734375,501.18402457237244,2612.141172885895,2110.9571483135223,4927.162480025177
314.946533203125,500.6506350040436,2616.986363887787,2116.3357288837433,4919.161973829092
315.04986572265625,499.8067054748535,2613.8871636390686,2114.080458164215,4965.2413730122835
314.9588623046875,500.007981300354,2601.2915692329407,2101.2835879325867,4960.168573527653
314.9910583496094,500.3595700263977,2616.9720764160156,2116.612506389618,5025.236300892205
314.9488830566406,499.1646885871887,2610.800024032593,2111.635335445404,4969.525194705258
315.1865539550781,497.16677951812744,2613.9315938949585,2116.764814376831,4955.299196833798
314.9830017089844,500.0584886074066,2611.1331367492676,2111.074648141861,4960.966968377297
314.99530029296875,499.9401433467865,2609.4836349487305,2109.543491601944,4970.212951035076
314.8634033203125,501.5115644931793,2612.772922039032,2111.2613575458527,5006.530359751471
314.95831298828125,500.59478306770325,2620.4308309555054,2119.836047887802,4949.616026662861
315.0038146972656,499.96252608299255,2612.5604004859924,2112.597874403,4951.647138338533
315.0461120605469,498.73904490470886,2619.7401571273804,2121.0011122226715,5005.384372380803
314.7723693847656,502.99812269210815,2615.738651752472,2112.7405290603638,4938.07171620681
314.8085632324219,503.98452615737915,2620.8091559410095,2116.8246297836304,4999.203946935003
315.1026611328125,497.3974244594574,2616.0541949272156,2118.656770467758,5016.775766040283
315.0211181640625,500.39752435684204,2616.7421736717224,2116.3446493148804,4979.094343522196
314.92559814453125,501.7985985279083,2628.472809791565,2126.6742112636566,4991.084234612146
314.922607421875,500.2599024772644,2622.436197757721,2122.1762952804565,4961.977956821319
315.15850830078125,498.6257236003876,2621.127398967743,2122.5016753673553,5024.971566136573
314.9543762207031,500.5296859741211,2623.498282432556,2122.968596458435,4970.103576030173
314.9615478515625,500.3307321071625,2618.01779794693,2117.6870658397675,4897.931273019346
314.9975891113281,499.5820908546448,2618.5091829299927,2118.927092075348,4969.141632777928
314.9792785644531,499.67055773735046,2618.863004207611,2119.1924464702606,4992.218731745304
314.9437561035156,501.82863688468933,2624.137655735016,2122.3090188503265,5006.072572872775
315.0078125,499.9843065738678,2619.776571750641,2119.792265176773,4966.235046712712
314.8486328125,500.7497663497925,2626.711881160736,2125.9621148109436,5004.847591731123
314.9291076660156,501.2835006713867,2619.415885448456,2118.132384777069,4941.465483238254
315.1958923339844,497.3812372684479,2626.850157737732,2129.468920469284,5003.059880120656
315.3844909667969,494.8151926994324,2623.80441904068,2128.9892263412476,4984.467524847181
315.2641906738281,497.14956617355347,2624.7174429893494,2127.567876815796,5031.971137657284
315.1514892578125,497.3413372039795,2619.866086959839,2122.5247497558594,4954.35509627719
315.0552978515625,498.9192361831665,2630.916527748108,2131.9972915649414,4909.084277899442
315.1927490234375,496.3918981552124,2626.3212881088257,2129.9293899536133,4977.613472082349
315.2185974121094,497.54400753974915,2630.915543079376,2133.371535539627,5017.849795317475
315.1643371582031,497.63131880760193,2626.4770221710205,2128.8457033634186,4956.472312068642
314.9698791503906,499.9738435745239,2634.7339267730713,2134.7600831985474,4991.573092357924
315.0029602050781,498.9606919288635,2629.8078384399414,2130.847146511078,4989.386580064001
314.8338928222656,501.8475618362427,2643.2494287490845,2141.401866912842,4949.818714411959
315.3272399902344,495.9573395252228,2627.6438703536987,2131.686530828476,4921.671302889208
315.3948974609375,494.8194079399109,2629.162003993988,2134.342596054077,4958.159239431388
315.2733459472656,496.41733145713806,2637.122395992279,2140.705064535141,4981.645231272788
315.1134948730469,499.1142466068268,2630.093327522278,2130.979080915451,4964.281029124269
315.1499328613281,497.33652925491333,2635.3507862091064,2138.014256954193,4923.402142815151
315.25091552734375,495.97939229011536,2635.7273783683777,2139.7479860782623,4967.594333776196
315.29547119140625,495.3939709663391,2640.810757637024,2145.416786670685,4929.801278825215
315.3021545410156,495.9499628543854,2635.352234363556,2139.4022715091705,4963.327321347833
315.0514831542969,499.3866534233093,2634.9855918884277,2135.5989384651184,4968.943382203985
315.0253601074219,499.57416009902954,2629.216037750244,2129.6418776512146,5000.6032101707415
315.3931579589844,495.5079824924469,2633.788778781891,2138.280796289444,4956.183711741159
315.1514892578125,497.19832849502563,2644.066384792328,2146.8680562973022,4991.768707074067
315.106689453125,498.9661531448364,2637.019362449646,2138.0532093048096,4970.785337723702
315.2135314941406,497.16529083251953,2647.222071647644,2150.0567808151245,4947.250599768989
315.0562744140625,498.19722294807434,2635.191325187683,2136.9941022396088,5008.322866146528
315.5082702636719,494.5795154571533,2638.397930622101,2143.8184151649475,4960.4022978546445
315.2605285644531,496.8187780380249,2639.0093927383423,2142.1906147003174,4998.430663154786
315.1882629394531,496.9197564125061,2645.91361951828,2148.993863105774,4940.784435856991
315.2241516113281,497.6220180988312,2642.256628036499,2144.634609937668,4987.52260279468
315.0227355957031,500.2444398403168,2639.463143348694,2139.218703508377,5034.894957304213
315.4646301269531,493.70758724212646,2630.33055973053,2136.6229724884033,5014.100622416564
315.1863098144531,498.5562174320221,2633.7758655548096,2135.2196481227875,4918.313676054585
315.10272216796875,498.24560165405273,2638.641486644745,2140.395884990692,5004.285004835407
315.3614196777344,494.96664786338806,2641.568468093872,2146.601820230484,4934.42506812014
315.099365234375,497.41418051719666,2642.787627220154,2145.373446702957,4937.704449581805
315.1185607910156,497.85348987579346,2651.4656748771667,2153.6121850013733,5017.232460186677
315.1509704589844,498.79766488075256,2650.1287274360657,2151.331062555313,4987.919356294625
315.16192626953125,498.65534687042236,2637.2679481506348,2138.6126012802124,5003.619019516898
315.6828918457031,491.69143319129944,2644.14724445343,2152.4558112621307,4915.136565358722
314.9480895996094,500.2178728580475,2645.77250957489,2145.5546367168427,4991.062621226654
315.2660217285156,496.10869240760803,2644.2025270462036,2148.0938346385956,5030.038186489707
315.20245361328125,497.9361832141876,2650.4225096702576,2152.48632645607,4960.036521172206
315.2648620605469,495.9806065559387,2649.8972635269165,2153.916656970978,4982.9139988220095
315.4037170410156,495.90907859802246,2641.9499344825745,2146.040855884552,5030.741449518186
315.1947326660156,498.52037382125854,2647.886435031891,2149.3660612106323,4959.3259662922555
315.0562438964844,499.4612970352173,2648.8908338546753,2149.429536819458,4971.912663374265
315.04180908203125,500.52028131484985,2641.2240715026855,2140.7037901878357,5004.766037685071
315.3041687011719,494.84541940689087,2640.443905353546,2145.5984859466553,4989.770565358628
315.66412353515625,492.46242213249207,2646.668046474457,2154.2056243419647,4965.497763802703
314.9762268066406,500.4630630016327,2645.8164105415344,2145.3533475399017,4985.673149495592
315.3558654785156,495.61779975891113,2642.2023668289185,2146.5845670700073,4926.332486082557
315.0592956542969,498.9276511669159,2649.263605594635,2150.335954427719,4984.59116166488
314.9921875,499.1014449596405,2654.9007959365845,2155.799350976944,4938.419646504145
315.5143737792969,492.8212127685547,2649.8771505355835,2157.055937767029,4922.471218521422
315.3141174316406,497.1984145641327,2648.232714653015,2151.0343000888824,4976.804150919732
315.0378112792969,500.75183033943176,2644.319254875183,2143.5674245357513,4907.061837030093
315.3977966308594,493.8097071647644,2652.1240224838257,2158.3143153190613,4919.992325396141
315.4107360839844,495.7491149902344,2647.306879043579,2151.5577640533447,4925.092912266113
315.0645751953125,498.9860186576843,2647.6297998428345,2148.64378118515,4922.9973101939
315.3200988769531,494.7245213985443,2651.79203414917,2157.0675127506256,5005.469488180982
315.4609680175781,494.56700015068054,2655.6611652374268,2161.094165086746,4979.469785389243
315.1261291503906,498.5522811412811,2652.9976773262024,2154.4453961849213,4953.54573070489
315.4197998046875,494.8633418083191,2650.7249665260315,2155.8616247177124,5008.950797978205
315.3681640625,495.1150333881378,2649.166804790497,2154.051771402359,4882.978075272521
315.1403503417969,497.15504574775696,2653.376721382141,2156.221675634384,4967.357690238521
315.2293701171875,497.4165298938751,2644.3315682411194,2146.9150383472443,4923.666907288526
315.1007385253906,499.0896027088165,2644.946063518524,2145.8564608097076,4973.899831319369
315.2402038574219,497.0829780101776,2646.5207476615906,2149.437769651413,5003.192376437995
315.5228271484375,493.33886098861694,2649.5884580612183,2156.2495970726013,4927.379547987383
315.35589599609375,496.24063062667847,2651.3270287513733,2155.086398124695,4987.607332297861
315.31829833984375,494.842413187027,2646.4512996673584,2151.6088864803314,4982.88891629214
315.4714660644531,493.84157824516296,2649.9744362831116,2156.1328580379486,4980.09929570973
315.2680969238281,496.3957426548004,2654.1856560707092,2157.789913415909,4991.151765702279
315.15771484375,497.9340543746948,2653.616641521454,2155.682587146759,5001.396349245293
315.482666015625,492.6469748020172,2654.5397267341614,2161.892751932144,5008.196820568819
315.6027526855469,491.5892610549927,2649.65540599823,2158.0661449432373,5015.126475967223
315.32257080078125,494.73916816711426,2657.618015766144,2162.8788475990295,4980.872092846716
315.190673828125,496.91176199913025,2659.255799293518,2162.344037294388,4983.458714565127
315.3320617675781,498.95609760284424,2656.67272233963,2157.716624736786,5026.872378156452
315.0760498046875,498.2437882423401,2660.05561542511,2161.81182718277,5021.771876837778
315.50048828125,493.8220853805542,2656.653639793396,2162.831554412842,4998.603822587186
315.1570739746094,497.3421902656555,2658.134943008423,2160.7927527427673,4996.479623778593
315.2503967285156,497.4623556137085,2664.3067469596863,2166.844391345978,5016.001769423043
315.19866943359375,497.5641531944275,2654.5279307365417,2156.9637775421143,4968.24857504099
315.2756652832031,496.769903421402,2655.4656071662903,2158.6957037448883,4946.02194287124
315.5610656738281,493.49390983581543,2656.653949737549,2163.1600399017334,4972.142294465081
315.3282165527344,495.35939288139343,2652.6102204322815,2157.250827550888,4992.33781353479
315.2253723144531,496.75684928894043,2660.767447948456,2164.0105986595154,4993.028686114757
315.33648681640625,495.46237087249756,2661.0530109405518,2165.590640068054,5036.578464040392
315.4676513671875,493.78042578697205,2653.138448238373,2159.3580224514008,4971.854980428219
315.0955505371094,499.12922835350037,2658.1786608695984,2159.049432516098,4970.34825073039
315.2173156738281,497.2428367137909,2658.5647406578064,2161.3219039440155,5007.892892658551
315.4057922363281,494.1123445034027,2670.6639552116394,2176.5516107082367,4875.230782178854
315.14959716796875,498.62066555023193,2665.1818675994873,2166.5612020492554,4938.03920810348
315.5385437011719,492.38322281837463,2656.892825603485,2164.5096027851105,4978.257440804944
315.5250244140625,492.9391939640045,2669.2809748649597,2176.341780900955,4987.91209676399
315.431884765625,494.8999936580658,2657.693193435669,2162.793199777603,4996.261713953666
