trian_config 
gae_lambda:0.95 
 gamma:0.99 
 clip_coef:0.2 
 max_clip_coef:4 
 vf_coef:1 
 ent_coef:0.0 
 learning_rate:0.00025 
 ratio_coef:0.5 
 grad_norm:0.5 
 max_version:1000000 
 pg_loss_type:1 
 enable_clip_max:True 
 use_noise:True 
 enable_ratio_decay:False 
 enable_entropy_decay:False 
 enable_lr_decay:False 
 enable_grad_norm:False 
 enable_adv_norm:True 
 enable_mini_batch:True 
 gae_length:512 
 num_envs:8 
 num_steps:512 
 use_gpu:False 
 mini_batch_size:512 
 tensorboard_comment:gae_length_512_num_steps_512 
 check_reward:[53.91083255692726, 51.777024188430126, 53.201772571218996, 51.9722641667351, 52.423537486590625, 52.54359263534981, 52.54389002464282, 54.59759102228689, 52.66063424405489, 53.13745818122152, 52.63469216453322, 54.63765519230213, 54.02916787731526, 52.73917410756262, 55.0259842906817, 52.72211999817878, 54.91670053559065, 53.305104113956865, 52.25044404437477, 54.78852946265479, 53.97869068237677, 52.01680431561192, 54.6466985975175, 54.41084613020165, 53.01653156830407, 53.71232950650181, 52.84622423422072, 51.768762503771754, 53.971637247045656, 54.48774594426943, 52.61266790093977, 55.086732696152126, 53.48295324346298, 54.565799885885234, 52.960091614175134, 53.86150676799109, 53.66348080435065, 54.77951823496768, 52.97106353950506, 54.345687094082805, 53.80256757458977, 53.449568887414934, 52.09946184172328, 53.938798976325046, 52.877200959045766, 53.02522774381276, 52.598030401917114, 54.4047847225744, 54.65284865721067, 53.47926975728313, 52.306640217821396, 53.34445445082257, 55.34327946861188, 54.55354826025094, 51.73470461479597, 52.552929131610284, 54.24577020837725, 51.960593409558285, 53.166272105376464, 53.045569570382696, 53.311789375691006, 52.2789891840341, 51.89878710781862, 52.89487788192287, 52.12837251423406, 55.225716377963806, 51.335916445580494, 53.76598331112714, 55.287325149193045, 54.11935191576448, 52.7927556873182, 55.50478159985068, 51.85830239910706, 53.877157062686436, 55.39954669911894, 55.67157567321355, 53.09221100620371, 52.48174501285182, 55.16667642094201, 54.243210774720936, 54.688702454950246, 54.7856839136263, 53.101984104242156, 52.87275048469717, 51.690019147631304, 54.197808064913964, 53.83952661157572, 54.151018359915575, 51.94335548936821, 54.367548310868784, 52.71986704446129, 54.16498942706157, 55.19819175594379, 52.69020125890055, 53.75191082023619, 52.279648312142825, 53.25797783657722, 53.87906161050889, 53.279275882514504, 53.54410694088629] 
average_reward:53.48324161765812 
check_reward:[78.36750421279243, 80.10709323401286, 79.72425883047588, 77.96857370423217, 75.9376241237405, 78.27932528975548, 77.71053933139781, 80.60955399046088, 79.89128469027929, 78.6467681844183, 78.78794468406161, 77.91868438156769, 76.23178360158846, 78.68956565254706, 78.48083045488599, 76.05653961831592, 77.08737491276909, 76.32432974203206, 75.83990821349084, 77.40432837822783, 80.31618806634904, 78.59440146772451, 78.59702952216392, 77.36037044979506, 78.87848731615695, 79.66186764099201, 75.54532568049174, 77.18434533995833, 76.49647091287407, 77.03659047097466, 76.26357916423547, 75.17291435166165, 75.81354367980882, 79.44628965869907, 79.09764386705044, 76.92188291218807, 76.41625021908249, 76.01291019468809, 77.08681669907585, 80.74028772769748, 80.37049837883364, 76.46328741859368, 78.72616643473953, 80.02104137813087, 77.73556214421507, 78.06449854367905, 80.51420680301531, 78.08493892724918, 78.13522080149602, 75.23212527432537, 77.09773043541861, 77.58798223392256, 78.54607938618717, 76.19973164392758, 74.40134770478736, 77.55826011006789, 79.60028761861818, 75.3965856810419, 78.81196119234062, 76.36188595850709, 76.6509029280717, 73.23767193532268, 78.80177104482613, 77.8234285696418, 78.8376300077611, 78.38417227438106, 74.98529952556757, 76.71053814241742, 79.84752298783134, 76.51180667779693, 76.17483093133832, 75.83288926578386, 77.56482421199783, 79.37961721967052, 77.4074357669246, 79.10750947979926, 79.84310576950921, 76.32879474968574, 76.96157478066011, 75.66240768067027, 76.90871942234901, 77.55782725643401, 80.5427831929173, 80.2783258678578, 75.06899523679101, 75.56761389915816, 73.98491015172196, 77.87502056088043, 76.63346745420156, 78.05694721434897, 77.68563317595236, 77.25367264639608, 78.78468353971343, 75.32891860449938, 80.44025036770533, 79.41418072612748, 78.84697739708301, 76.33938515828899, 77.76050221319502, 78.61551595511138] 
average_reward:77.66614472632206 
check_reward:[81.32957912176838, 81.63056999807965, 80.40503281620005, 80.73861200880242, 79.94197958458554, 80.80752049143831, 81.94150419677102, 81.81626130129592, 81.61467095080988, 81.12619971252929, 80.20643719892036, 79.41250369784412, 82.41756006604732, 79.71117627151932, 81.10710979921151, 80.764492882971, 80.17728326615143, 79.19716195163902, 81.43516913745181, 80.85287295665441, 80.30540704235203, 82.64244394683092, 80.47916060582412, 82.05275227303407, 81.94640215909129, 79.63873309412028, 82.02911751991039, 79.01360573125277, 81.67970767268926, 82.31784551924902, 79.73216393905439, 81.98046693904419, 82.68768095161148, 82.86175635785636, 82.09136704366105, 82.10043034526247, 82.7992756036769, 79.68934796006167, 80.90530077754815, 80.50707253435905, 80.36066814007563, 82.28960747719509, 81.85329935859394, 81.01289964516394, 80.71719549261994, 81.8161359457624, 79.71810274728514, 80.5535337484172, 81.93902012721506, 80.46863722507251, 81.72348694160056, 82.5489403255523, 82.6624807925192, 82.1157986088603, 81.06045369692934, 81.68082465084842, 80.75485139928456, 80.13389914498609, 80.15172710953323, 81.77087171337814, 81.82265676137503, 81.80620746936687, 82.61119857382276, 81.1171136817065, 80.87398421279016, 81.08006253551291, 81.36003018515376, 82.31814420410424, 82.41048126320453, 82.02214885933843, 80.3744817178759, 80.8987118069881, 80.48362332684827, 82.1942988062496, 80.56364894295997, 81.65633760577606, 82.35892731005143, 81.1800790646462, 81.60965269511014, 82.16462463375282, 80.85854881666748, 79.84699399591304, 79.74842180084825, 81.25435244752698, 83.31516448839022, 80.2772424483357, 80.67998342534435, 83.0567336060279, 81.38491646306105, 82.6143918555262, 81.88713872542948, 81.26961334400205, 82.2739249565469, 81.54935279954616, 81.01701443641511, 81.38714035997309, 79.93273544210672, 80.30967067838203, 81.90903480266213, 82.72516470382887] 
average_reward:81.2763012297124 
check_reward:[54.67891709649027, 57.11111331276132, 56.01902129473996, 57.37762922849013, 56.88763782333707, 54.015466106764464, 54.25167807175433, 54.39892767137003, 54.16196643358923, 54.85189966091852, 53.899919005785584, 56.200056718725236, 54.50322558539482, 55.35342209883365, 56.31404970387633, 55.88105277214258, 55.43084428519374, 55.68242757249469, 55.38107093433587, 55.16077475247429, 55.49826562841782, 56.61013551612276, 55.35919798301507, 54.403689380380015, 54.88047024437249, 56.3272952246931, 56.32303053668947, 56.34990305459946, 54.52789657624891, 56.18594433329747, 56.790022694024074, 54.58047600345958, 54.64026704920029, 56.45654455717528, 55.71798656314604, 54.6807716219461, 55.20904848317491, 56.344598488612185, 56.00092928235878, 54.20609178572669, 54.74358706503747, 55.90614553178681, 55.19659951494217, 55.26548562393746, 55.64958518338892, 55.99260491646597, 56.26698620981146, 55.65583699160234, 55.44523092704434, 56.27651300559147, 55.615917130484625, 56.98426551444544, 53.502692769063465, 56.31406624198654, 56.77671338808833, 55.076915391085606, 56.17003742366734, 55.580770122616244, 56.32383715175637, 57.25127405830417, 55.60918528544322, 55.78984355889236, 56.11667603183392, 55.78281662946719, 55.07109491929113, 56.35568304851506, 54.336002241672574, 56.57695503299108, 55.24719667952787, 54.79500518616038, 54.562029537432686, 54.99960482610536, 54.216612222088166, 56.38069747809156, 57.2068669362848, 54.7902205348485, 55.647718656061215, 57.15077484698504, 54.72655714703932, 56.468358776510755, 54.783441927494444, 56.45438223469129, 56.78920813559933, 56.5348998587724, 55.62266204524917, 56.89176590285143, 54.66082197650984, 56.88989497652685, 56.43923691741597, 56.59270862375397, 55.873492016858506, 57.15151612286817, 54.47386087746552, 54.784386744409076, 54.99637378375622, 56.493394881071104, 57.01789013445091, 56.154854408738814, 56.13239307621975, 56.966002000627135] 
average_reward:55.68181815517811 
check_reward:[75.92234717057366, 75.53171302566498, 73.85891819859148, 75.53597944617438, 74.3584160950856, 74.86610273417848, 73.10587257255162, 74.30028354165347, 74.95455537325353, 73.44028299206511, 74.37889419331268, 72.89277804706072, 74.53149161859076, 75.43594776499141, 73.39664269640845, 74.23047197563872, 74.32694976553532, 75.2304212299451, 74.61025001770392, 73.87716429075871, 75.82570240884338, 74.27224546361269, 74.77196361534936, 75.05906363989021, 73.46171601316459, 74.32087735220178, 75.22492770587665, 75.77788070961176, 74.060596731172, 73.64260543191703, 74.88412593692759, 76.11682069010183, 73.79419010872401, 74.87150267879113, 73.42122862987625, 72.50654044613937, 75.50341468978738, 73.03480332191856, 75.01042305990146, 73.55367383751067, 73.01982799166507, 73.36908010817909, 72.68610746756842, 75.24683489042648, 73.1631396619712, 72.99222640371785, 73.38458607423499, 74.07161723622674, 74.33677387295413, 75.52780551447879, 75.5291959377669, 74.39416807085175, 74.99453023015013, 73.95954281606627, 75.16610659702108, 74.08119505117946, 75.63465045671936, 75.20935665057412, 72.2881005034257, 73.93782377561102, 73.15877060560939, 73.54183637045865, 75.74721652498442, 73.97053160053963, 74.95328720540004, 75.33640859254425, 72.91663191912168, 74.8017742678504, 73.238157600382, 75.14942187901829, 75.89591396973297, 73.61657336492712, 73.9796406564378, 75.8685329037263, 73.6195554828295, 74.5791888947957, 74.9865831896569, 75.14974681027323, 73.93288146024187, 73.83761480737033, 75.8062836400728, 75.60552483632554, 76.79878680011262, 74.79935936433438, 74.71914239265581, 74.28148760984323, 74.2308717714239, 74.19764713800733, 73.36197212603349, 73.01102173861696, 72.89294896335102, 74.74998280152458, 73.34738836884763, 75.09715410937437, 75.51692925734639, 75.06079016641957, 71.49424380696016, 76.30070781347781, 73.51198687957972, 73.75195263828218] 
average_reward:74.37708904860335 
