trian_config 
gae_lambda:0.95 
 gamma:0.99 
 clip_coef:0.2 
 max_clip_coef:4 
 vf_coef:1 
 ent_coef:0.0 
 learning_rate:0.00025 
 ratio_coef:0.5 
 grad_norm:0.5 
 max_version:1000000 
 pg_loss_type:1 
 enable_clip_max:True 
 use_noise:True 
 enable_ratio_decay:False 
 enable_entropy_decay:False 
 enable_lr_decay:False 
 enable_grad_norm:False 
 enable_adv_norm:True 
 enable_mini_batch:True 
 gae_length:512 
 num_envs:8 
 num_steps:512 
 use_gpu:False 
 mini_batch_size:512 
 tensorboard_comment:gae_length_512_num_steps_512 
 check_reward:[1036.223877817196, 1024.6041888863522, 1029.8750987258795, 1038.548517163889, 1027.13829856735, 1035.2357775703365, 1028.761264894981, 1018.8142100092347, 1015.8677365252496, 1037.3552676710174, 1055.1701318575401, 1020.8954238741951, 1051.5632845786167, 1039.9774717422936, 1051.6568117614165, 1018.1900054110288, 1039.3179876049585, 1027.0227755432509, 1054.2541468738236, 1007.0253195869353, 1021.8952392960726, 1032.9916326850082, 1021.5408969414026, 1050.249832615383, 1031.7908551226815, 1015.0884891655732, 1032.783066329977, 1012.9107800210475, 1023.8787986332509, 1023.1903841154101, 1017.4243477041882, 1043.5928691637455, 1048.5640974050593, 1038.5858749053928, 1029.5573280731687, 1035.162955380805, 1020.6441078341155, 1044.9247364894259, 1063.1903396832188, 1053.570895421075, 1022.0784773023239, 1027.6467544873376, 1027.1136844215114, 1032.2585437570606, 1027.5196109917165, 1028.5783446373453, 1024.0121231060882, 1056.5070059544846, 1044.5982075013344, 1045.2912899401767, 1032.1978635666483, 1015.3482399625369, 1029.4776814432475, 1052.9974967677117, 1030.7318246946056, 1044.2116620605266, 1021.5291168233352, 1029.2612118156776, 1037.1186821155497, 1027.466497371863, 1018.6682023831867, 1034.95870183418, 1028.419988762595, 1037.6150782107536, 1039.51681274561, 1028.2264660117241, 1040.39576339561, 1029.4911843314412, 1023.8090408072642, 1043.8146415723481, 1021.9515940248939, 1024.4883384482778, 1025.4227568770866, 1024.2772082765882, 1028.7071229977316, 1014.173028331402, 1037.828740819842, 1066.949564762893, 1015.9606807627413, 1041.8554724287196, 1028.0496343996983, 1023.7757485134991, 1039.5666877851486, 1046.2735363936017, 1034.484449500681, 1065.0141977005082, 1076.5836412213177, 1037.5850737479273, 1027.128275560275, 1025.596565946913, 1027.481357774896, 1013.0694261968788, 1043.5564410922336, 1037.3328264757952, 1026.2137281437076, 1014.746631227317, 1041.4156873114316, 1059.4168418627983, 1034.975875063974, 1020.2476803560512] 
average_reward:1033.2402413643215 
check_reward:[975.171272201025, 976.8760127029902, 979.758553877468, 977.5364124047442, 975.7799120496513, 975.9297395305839, 975.2307076870113, 978.809261113209, 977.3705545916928, 976.8135827683232, 972.0152723821716, 973.293419152423, 976.3498183639239, 968.1977306705686, 974.5814942919808, 973.5716542978275, 975.7692876615035, 975.610581018524, 977.8539622097485, 969.5920069353626, 976.775106390131, 979.680599886887, 977.1901364344726, 975.9180741737596, 979.788023186915, 973.3460187206853, 974.2383654110749, 976.6545054488803, 981.3158576443931, 974.9963478221227, 976.0769341318904, 973.279299429147, 974.1153288852769, 974.8301469325836, 970.6710694573196, 974.7026463397451, 982.7541788502962, 976.4600729441463, 980.3202644658069, 974.6263373342347, 976.1291015343072, 974.5591332167845, 972.4013971182258, 976.7686633689589, 978.5963268247209, 982.6103002062337, 973.1095240150719, 978.5771540198657, 977.9924973414439, 976.0013939471953, 979.7550805187936, 977.1573631715676, 976.2031398576405, 973.5814325838487, 977.1012840613115, 979.2830389968047, 978.5400146429236, 977.7599547601942, 976.4447985259987, 973.8078919352723, 973.1869609043172, 969.9573293887995, 971.0414817421378, 978.8993986132981, 977.1387308059258, 977.6707787786387, 970.8225068470506, 974.1106968146346, 969.023519907202, 973.5656213381636, 976.9258378419522, 965.4913146585844, 982.151087695726, 978.0535053868616, 974.726095739335, 982.7069491738418, 973.3683106408108, 978.8045169757279, 973.3788006578379, 978.9680737946891, 969.0168759026121, 979.1688403661827, 977.511313165845, 978.1323282676276, 978.1371599293825, 977.7799862222231, 978.0157615318074, 973.9576754228826, 973.5640332173468, 978.3907361205063, 975.3734096949015, 974.4728554681841, 980.1611615097909, 979.115857949422, 980.7490544929776, 977.0919306084552, 977.6725406398308, 973.0469281598592, 973.8928208657135, 973.5396507890882] 
average_reward:975.9901247847785 
check_reward:[1072.3331248848963, 1056.9450104096668, 1036.445263199987, 1065.9372531476215, 1050.8811932638478, 1034.9710248867964, 1115.1625773163692, 1049.7484451785374, 1038.04047945697, 1040.0778172968066, 1061.4034327882, 1029.0325825813434, 1116.2217253995395, 1104.1996006908091, 1049.1906521473904, 1041.5408997343425, 1025.3847605126007, 1062.2594923558117, 1104.3434924097726, 1101.4286231119222, 1071.7070235773208, 1068.1007661856258, 1066.078432540118, 1114.283183186747, 1072.986553800514, 1115.0887600730362, 1018.2780118121419, 1104.7134117571268, 1082.1653063392923, 1031.0977695859428, 1076.4566483416384, 1068.5932074256382, 1106.9509380919494, 1050.1918387502983, 1056.4098409636936, 1122.876676955707, 1084.8255522328293, 1037.6965405426427, 1051.1894181834055, 1061.7918761393903, 1114.6366865416048, 1086.132057498434, 1052.5685056672626, 1056.103534046864, 1071.0471315558586, 1084.8734809694176, 1057.4071106014208, 957.3820845351659, 1041.1185259939014, 1060.5139343240946, 1109.0510266109568, 1082.1164990698624, 1145.2968143276657, 1031.657734274911, 1039.0018920107022, 1072.651439800454, 1054.805810268167, 1029.5627212214458, 1096.2203837743164, 1022.5515243190633, 1069.0102373473733, 1076.3938274666293, 1041.5936245805985, 1019.48979204748, 1078.881696689912, 1079.2721538225246, 1067.1249979149402, 1062.7543313388865, 1033.9821517839869, 1055.2929802394708, 1120.3781386715646, 1083.8084802409408, 1105.2313626370617, 1063.98980066487, 1069.0124771627181, 1078.8727819987778, 1099.2860680919034, 1048.2169961812533, 1065.952239643224, 1053.436202529153, 1086.4879626880017, 1054.6112350052128, 1071.232439677674, 1068.2724317900515, 1062.3910366895998, 1026.9832684425573, 1052.060621798915, 1041.0140764883872, 1070.4737466670074, 1034.4033532310461, 1071.734535223378, 1017.5708681679163, 1018.584552761014, 1012.1810760461703, 1027.8366926481476, 1062.5496115028925, 1084.0147703977264, 1046.416016077504, 1057.2043793463943, 1050.7921201112733] 
average_reward:1063.70523240484 
check_reward:[1620.9715312140365, 1599.5724687377558, 1560.9375450603734, 1577.4741457035457, 1591.5364850450474, 1557.7898644610518, 1597.9776159560593, 1577.476784985052, 1622.8366903110964, 1609.5697723970504, 1574.6611963412633, 1619.408383905759, 1604.8946193796048, 1607.1467847451202, 1532.5620032569823, 1552.3129908534793, 1595.0506094756179, 1610.9665916835643, 1484.059021668665, 1618.5246074749966, 1614.951926347791, 1595.6820636823213, 1563.701045589576, 1608.2353901297233, 1595.5113597054676, 1593.4818010210156, 1600.1527811309481, 1588.019536578441, 1603.050902759153, 1587.6148836967504, 907.5034783610279, 1604.0779459264481, 1587.462722435415, 1626.2695184990125, 1543.6472309691692, 1601.7530087414978, 1544.29110739669, 1624.6698569207056, 1559.6315184168598, 1586.0273656799022, 1621.622602343883, 1590.6002653955557, 1579.9513743034468, 1616.402256087231, 1594.0810263566975, 975.8962245204177, 1570.8317621405827, 1561.8556995050667, 1563.3265717511058, 1590.4988994702435, 1609.988625294964, 1584.423536083958, 1623.2231074984136, 1585.35321536701, 1569.5465515355713, 1591.4670021613654, 1561.2429255911163, 1590.9472236156648, 1593.7083540796843, 1595.5727267472707, 1596.4043287624395, 1591.5041198882368, 1594.663887066511, 1611.5259923414105, 1548.8553871829886, 1544.9789620476595, 1568.3737311817722, 1605.6467646973292, 1579.0379407849578, 1588.430422285357, 1600.278528812295, 1542.2970361908792, 1608.2359327252104, 1554.185489044757, 1595.3150705105566, 1572.2512249370604, 1576.9680057198686, 1518.8027400332242, 1614.2087292923047, 1568.5982912118288, 1625.2990112202333, 1592.6485555377308, 1623.5317425828637, 1614.7379586557277, 1572.6371082803234, 1624.7304359748696, 1615.14522138537, 1568.966587709066, 1594.2146139560632, 1602.8435014332404, 1512.7463605488422, 1599.4361070922146, 949.9183557232045, 1616.2752531333886, 1623.0339048726853, 1539.6763457488255, 1611.7400598118202, 1587.2409174100426, 1564.770299334774, 1586.6498814277807] 
average_reward:1568.28809913049 
check_reward:[2138.4440099103217, -20.056401486057457, 2109.905683733065, 889.2529043198643, 2162.414852988923, 2180.6449954697846, 916.5283108505502, 2081.6572721162015, 2177.2795735687796, 2089.880542157323, 2219.657542668837, 2139.6918367352073, 2163.6887972467093, 2189.970502078254, 2140.494419046086, 2192.0822185471875, 2093.8936408217214, 2171.633395622399, 2118.933383612958, 2092.5804279739696, -26.469101490450896, 2211.9723469457604, 2040.283980169135, 2198.3222982849584, 2119.919631934976, -23.68463187892666, 2187.8916077275935, 2184.849964585094, -26.863618347757665, 2201.3913647511654, 2131.6528634798315, 2090.596705897938, 2108.206529459447, -13.545278173741044, 2142.307213206012, 2192.0498894611346, 2127.9363133609622, 2032.7450623574534, 2139.4385013901883, 2151.5891334534035, 2124.2814877869578, 2159.433540262757, 2176.4058500880465, 2144.5813547735884, 2164.2384092342304, 2186.093867361514, 2124.241476388659, 2126.992402072717, 2084.2573704228334, 2129.0084534278835, 2128.676816423998, 2185.056002689716, 2084.930260498734, 2201.433526013367, 2178.0399000085663, 2194.4661378108813, 2106.655368460914, -14.676092408170403, 2174.2491938812736, 2041.2866847979067, 2166.8653584690333, 2138.208927019203, 2187.9265109620737, -20.026631992559917, 2019.7646514330554, 2162.0258112813144, 2143.944812185232, 2102.0836105771664, -18.951006041575052, 2078.253475855723, 2081.997155671711, 2073.129042130183, 2077.6115608710525, 2133.0665970212017, 2061.621783569544, 2114.9491955509593, 2169.6259753075674, 2157.124502553598, 1964.165983856426, 2056.355209633357, -18.203566991434087, 2176.744815277092, 2176.1586299523115, 2187.2606533094995, -18.453010076576245, 2132.3137985295134, -17.296227026442075, 2098.2894142518107, 2206.374800269684, 2055.253197388143, 2204.6499722075446, 2136.2965391781518, 2127.4644644942096, 2121.484036879734, 2113.305209072084, 2117.7246353903956, 2199.365608285684, 2097.081504644542, 2131.254286391472, 2116.6376202405077] 
average_reward:1873.1226960213485 
