trian_config 
gae_lambda:0.95 
 gamma:0.99 
 clip_coef:0.2 
 max_clip_coef:4 
 vf_coef:1 
 ent_coef:0.0 
 learning_rate:0.00025 
 ratio_coef:0.5 
 grad_norm:0.5 
 max_version:1000000 
 pg_loss_type:1 
 enable_clip_max:True 
 use_noise:True 
 enable_ratio_decay:False 
 enable_entropy_decay:False 
 enable_lr_decay:False 
 enable_grad_norm:False 
 enable_adv_norm:True 
 enable_mini_batch:True 
 gae_length:512 
 num_envs:8 
 num_steps:512 
 use_gpu:False 
 mini_batch_size:512 
 tensorboard_comment:gae_length_512_num_steps_512 
 check_reward:[2131.5540154352666, 2250.573914814762, 2351.454951397235, 2127.4093507903435, 2167.528382298471, 2284.046148762369, 2078.9756360932715, 2097.7932001486042, 2328.904422055736, 2120.2866064798873, 2283.5134759058737, 2069.8231646418535, 2348.475590413113, 1471.2940765153744, 799.0075950791, 2088.559698736258, 2087.835758459859, 2312.3651848622835, 2038.739822425749, 2151.3233965291065, 2099.0857552127627, 2204.2191891864095, 2072.8946312727194, 2136.077118182675, 2167.787035706764, 2182.548627084103, 2270.7114352951166, 2281.097835432345, 2249.4940693587478, 2162.863304071853, 2354.648503330545, 2305.086405278734, 2149.4934585372002, 2152.3916942927135, 2270.180936936376, 2218.5258538254584, 2195.262226351195, 2267.5035421496855, 1909.3620939467644, 2220.4845196563624, 2183.3173957268436, 2307.7957536701433, 1291.638910320276, 2215.180923301368, 2354.3663913991677, 1966.1861364203185, 1472.0993236814593, 946.6961521966331, 2101.261381074275, 2469.2994719154967, 2283.169702537564, 2221.596263700785, 2325.450401753701, 1916.491274152284, 2069.471704863597, 2164.2535840068495, 1750.2894675718412, 2182.707374453679, 2095.5632289194773, 2319.9716130617016, 2143.11511014965, 534.0606031963971, 2120.752478257596, 1003.2954505716363, 2319.4914788067726, 2079.08723526373, 2191.7432364095157, 2168.4771652357563, 2244.9161209488275, 2234.828486500176, 2225.0732115049386, 2153.5605095432193, 2314.49692351713, 878.9134779479608, 1478.0331175636636, 1997.755215713406, 2358.151495074185, 2272.7977501157275, 2291.388025693478, 2241.2258094489616, 2207.0584119470277, 2247.7106487708706, 2269.393307773811, 2254.36698457101, 2058.515335968409, 2301.6435405581256, 2250.4498706016575, 2201.09313417215, 2315.0945736270965, 2166.1697132085255, 1408.3014683242568, 2212.385899133712, 2256.2413790189685, 2159.0020091008014, 2219.9122983772722, 2221.1546985462724, 2298.1819772024164, 2211.902418971619, 2417.273155257639, 2335.1059401684247] 
average_reward:2093.581087484433 
check_reward:[1716.537232153707, 1783.383737684039, 1747.853544077052, 1679.0226560991428, 1813.9535324959693, 1742.5438428536308, 1678.1791413312965, 1788.591428314392, 1640.8416276901678, 1785.6092267764554, 1735.9592843083028, 1698.3592317310909, 1710.9423387990992, 1779.377052281948, 1738.8600483705538, 1499.4842863100412, 1784.0254675690403, 1690.691882578845, 1806.2038177404675, 1722.5728593767576, 1865.8714294917288, 1681.1339319415902, 1631.9488891001663, 1975.934844029351, 1580.5543217196252, 1728.6736009077658, 1760.5338007089242, 1767.8068664211828, 1738.6000046686977, 1592.4586173752043, 1802.2755235994018, 1545.958493140785, 1933.8308901929884, 1544.9064037554986, 1586.5363243484132, 1760.4275220517598, 1736.6925323596438, 1699.5555388219461, 1592.7718911463157, 1834.5344631707671, 1591.8582916029795, 1719.6564701103143, 1515.3879966547315, 1800.4150618232563, 1682.3788102038284, 1744.785714200858, 1691.2822450543104, 1765.2515836860864, 1634.6803897185823, 1601.2070796880973, 1650.336498014161, 1768.7833303121665, 1588.8430567686516, 1768.2625313455242, 1712.8259010929646, 1490.1252325003256, 1675.1030111584264, 1643.3785085079344, 1794.1749027852513, 1678.704018237147, 1679.2451556127883, 1785.300931945168, 1764.048810872046, 1709.4252274277137, 1703.6116937549546, 1604.818235308541, 1690.1435992089991, 1924.593974910147, 1746.1978950777996, 1730.0032592942807, 1655.6690090451507, 1640.111252176194, 1652.2499399904762, 1718.6870527213464, 1873.2161605239423, 1655.992860162442, 1342.661963964404, 1918.534533153677, 1814.828719577399, 1704.7084543797318, 1900.452052546618, 1770.3199266930064, 1794.8886567766908, 1626.752862410687, 1722.0095287158777, 1677.5528502898783, 1806.036838352596, 1703.9391421074988, 1776.6908542367441, 1721.9546506983957, 1765.896092811502, 1512.1220665121177, 1561.1279723980329, 1791.7197974612905, 1532.2132879346254, 1766.3376374284478, 1894.4621619823847, 1660.0819831136646, 1892.8419713177298, 1518.6039976297677] 
average_reward:1711.314918214841 
check_reward:[1928.431751220402, 1971.024635029295, 2054.813824397661, 1934.593875533238, 2196.7477549469336, 1921.3069260769994, 2018.292567261144, 2170.5660628679384, 1891.9087839766096, 2063.4004304191612, 2122.3547331580176, 1920.4393086783832, 2024.681099429706, 1602.6317970322907, 1210.722874448368, 1573.6472140371268, 1302.9155954351093, 2027.209951382421, 2164.2852371894705, 1915.3251909586402, 1982.9241738346534, 1950.6780780621061, 763.9773970695171, 2101.5725175595016, 2083.1753467029002, 2111.7018986023704, 2129.467311544899, 1796.0990223248393, 1894.2701559052202, 1817.5882038906389, 2073.2122683826165, 2104.9846313610014, 1880.7064026196458, 2159.999695275043, 1882.8434514430578, 2004.500804426826, 1763.2646112486914, 1944.4781391696356, 1897.257854382579, 1803.0082304349426, 1836.0201450562345, 1949.799006905824, 1785.152470917932, 2013.4496583864209, 1943.0190624728302, 1958.6628228749787, 1875.8224591132048, 1905.5495807324, 2222.314255929757, 2075.23027027897, 2152.9938303625318, 2053.9149806325577, 1897.0978196043636, 2167.5583064362936, 2193.777203495405, 1741.163317849729, 764.492628732084, 2080.753867410776, 2060.6159770821437, 1915.4112887132796, 2227.0125264140997, 1895.0611299342154, 1962.4857172244494, 715.6430278774558, 2153.1064395283533, 2114.0164138085593, 2188.6101759877765, 2119.0431878247264, 2087.7291886404055, 1784.5939945374719, 1791.4506666776383, 2247.6952352559783, 1961.7451638951402, 2039.0453530799825, 1929.11526714719, 1778.5930922633152, 1705.4996762035257, 2147.4052590139618, 937.5337261299792, 2244.5363159053973, 2149.9668349792782, 1953.7534218651772, 2002.8186865078635, 1626.6789014242124, 1817.1048340772106, 1989.224820244221, 1980.3026917256948, 2061.9695782527115, 1832.2309239704396, 1111.6648377075442, 1780.1625417412033, 2148.956028218391, 1674.2843591858257, 1902.973985137285, 1947.4874177823713, 968.4108906155831, 2164.353357262721, 2011.2183589074814, 768.2658914458233, 1984.7668871943895] 
average_reward:1886.6032556630237 
check_reward:[3917.873490516945, 3932.8820659704784, 3962.15242081843, 3980.642803554339, 3995.199667975475, 3938.8146162583207, 3904.932159863977, 3924.6478015900907, 3942.213871206175, 3932.818042856893, 3953.4070335627343, 3940.33709339435, 3949.4697776594408, 3953.3358540936324, 3953.4809970280958, 3964.967865256585, 3946.667725187373, 3971.6543029439727, 3962.1743134687244, 3923.1481620501722, 3968.3876923504963, 3920.875022641463, 3923.699308235381, 3940.220444783499, 3947.9362960325393, 3966.142354999116, 3993.990371611781, 3946.7087887809284, 3962.582731840266, 3939.4452566019695, 3967.765131955669, 3956.849653156988, 3978.5383412380966, 3996.398878637895, 3936.844354548766, 3940.5351668081857, 3916.9711674479095, 3925.677471339992, 3921.4634838069896, 3950.9800447161483, 3936.9374164085893, 3963.98142314745, 3957.707227932682, 3958.914244613305, 3919.573053071279, 3949.4954736428563, 3945.800703609263, 3932.198364090037, 3947.3470149467853, 3995.008326431082, 3931.3840899507422, 3956.1439864934646, 3955.936875774286, 3959.754594448313, 3941.3303382932263, 3946.632441792629, 3924.0633503549925, 3946.930783921028, 3910.5218799629893, 3970.229625577259, 3968.3336359060004, 3918.4966005175856, 3945.925712897214, 3960.610919895962, 3948.7677704946273, 3938.834943051013, 3971.689211779795, 3915.952145808882, 3987.3025168978347, 3982.6520599057535, 3923.8461660624125, 4008.525545501105, 3924.1558160080367, 3929.721888349728, 3916.736941436533, 3917.113466575577, 3925.35888897667, 3939.826463715974, 3982.785316882129, 4001.255620567202, 3923.5360278559847, 3933.9191532056457, 3906.613799280108, 4001.57414569062, 3921.0364585772436, 3951.113432357167, 3972.8808919356406, 3948.6758709975093, 3993.7206461411884, 3970.3394353274416, 4008.0612445591764, 3972.0882660936068, 3923.8199657689647, 3930.0413308040966, 3963.496018104708, 3969.3172931212644, 3950.4229239135852, 3975.26396316003, 3936.0091275616433, 3960.1214806968583] 
average_reward:3950.2266634763496 
check_reward:[1842.0124213267186, 1717.751393741553, 1673.556444981119, 1847.2730524448425, 1648.8098638575761, 1702.2168537728066, 1823.6622686477326, 1898.6389760069665, 1785.8465272703706, 1684.9543144983088, 1793.8148953429863, 1615.052696674747, 1777.19885117447, 1791.2968656809353, 1758.3960017181118, 1705.0624227488358, 1669.24948108128, 1738.457148747421, 1831.4531614307552, 1750.5439924086259, 1838.8584102121704, 1701.2624393639185, 1748.351502815106, 1747.3123335219457, 1792.3670607648223, 1601.336517226991, 1659.2064264605672, 1859.6513567398829, 1519.9475397863052, 1757.0021815665818, 1686.171867942434, 1781.4037066085853, 1678.3569425067135, 1787.4025766640245, 1684.988712658558, 1787.8618778633086, 1723.7516751000467, 1762.202666600798, 1724.5855309838944, 1772.1560164334242, 1669.9798832218598, 1848.1681676930002, 1862.1058607470347, 1664.5972451843113, 1898.9920128890099, 1775.39669324625, 1715.5219538251545, 1696.1814830225928, 1829.1621558773381, 1774.7417540279662, 1621.5446001774749, 1689.7459823206098, 1752.454103363109, 1626.130778026746, 1739.0006996276568, 1627.1473819318044, 1623.6447775441593, 1744.3050781969446, 1690.3393796003265, 1773.0565793528726, 1779.7908515918948, 1665.2337458946683, 1720.731380134353, 1782.3721870836653, 1728.3879149899792, 1770.1975547387724, 1866.6136969497827, 1680.1325491375164, 1731.0076287769575, 1687.007949746508, 1694.181348088457, 1722.316858085746, 1889.9101484232701, 1721.981772132894, 1690.1174827244201, 1685.2377029385052, 1891.9552751037686, 1799.0062530185717, 1771.2844439239905, 1804.455299460737, 1843.210849485481, 1815.7302397998735, 1594.8653477484345, 1673.9834280116074, 1754.731107923281, 1745.1100617737798, 1714.3544743858915, 1638.4591066032654, 1691.477149986084, 1718.746375187036, 1742.9658986430927, 1895.4444075569759, 1785.6928269557752, 1661.1124990263825, 1638.912650817716, 1805.1292039735956, 1811.8973000903347, 1727.7302080107158, 1776.5755452663166, 1593.2695516586234] 
average_reward:1740.029618211012 
