trian_config 
gae_lambda:0.95 
 gamma:0.99 
 clip_coef:0.2 
 max_clip_coef:4 
 vf_coef:1 
 ent_coef:0.0 
 learning_rate:0.00025 
 ratio_coef:0.5 
 grad_norm:0.5 
 max_version:1000000 
 pg_loss_type:1 
 enable_clip_max:True 
 use_noise:True 
 enable_ratio_decay:False 
 enable_entropy_decay:False 
 enable_lr_decay:False 
 enable_grad_norm:False 
 enable_adv_norm:True 
 enable_mini_batch:True 
 gae_length:256 
 num_envs:16 
 num_steps:512 
 use_gpu:False 
 mini_batch_size:512 
 tensorboard_comment:gae_length_256_num_steps_512 
 check_reward:[101.79237277710311, 98.72939005087923, 99.28953525568393, 100.59322259451764, 100.99479820041346, 100.8227563631799, 100.9198329410734, 100.18268534098551, 99.86358341592978, 98.44079097875925, 97.56637495647158, 101.09601429347069, 100.36788640027191, 101.59216984670792, 101.78108740623847, 99.17403231899719, 101.05201894152013, 100.99792362807717, 99.14144109138721, 101.27520813845108, 98.37768780670504, 98.44647862743454, 98.99832331633274, 101.8127596655612, 101.91575626820385, 102.8627609619922, 101.24732885716773, 102.47918695951182, 99.63980900593448, 99.87422281135044, 101.25868278295995, 100.55732490733797, 100.74039728542864, 100.13936636601386, 101.14060368528258, 100.8236080347539, 100.64072337769927, 101.00234364101861, 100.23885089187482, 100.86227344889834, 100.99980569528259, 101.60485052493844, 101.43248765664342, 100.56993607297187, 99.23427048668682, 100.82601348898633, 105.44741092546835, 99.31740735033773, 100.04060452432307, 101.39530250734703, 99.45109976804571, 100.46121604112861, 101.75685841263811, 99.0391264856687, 100.64515955391411, 100.89872719875027, 100.60201602298433, 96.51580168165998, 101.96631760808069, 97.48369822322894, 99.93868852068763, 101.54017452078979, 100.99512039507414, 98.25827144179138, 101.6618970764962, 100.55487247182225, 97.8457474004331, 103.75416971952112, 98.69506948373518, 101.94380415582515, 99.54428001189117, 98.89440661138485, 96.62437445025587, 104.21168067150228, 98.22053592009479, 101.1855408752319, 100.99328815944337, 103.65830274390353, 101.26931253701144, 103.83709384633585, 100.05466294811158, 100.36406767978133, 102.13136681413482, 100.83866206283992, 101.20422514111938, 99.61719034163758, 99.97102296645629, 99.21706092702142, 99.06874106188314, 100.96840835702085, 103.0911699689141, 101.18897519245533, 98.93919526929531, 100.72590905033653, 102.18916746936294, 99.10222559541828, 101.74206379422017, 100.56087236889132, 100.67122086728637, 99.29039195248173] 
average_reward:100.52982954712564 
check_reward:[100.6050324511943, 100.66288151355795, 102.66421881620042, 100.07166889331717, 99.93628473720739, 100.14166771782564, 99.56568509711894, 98.63451741342064, 101.71997030725552, 98.82268451195353, 102.26124638569702, 102.98014258700007, 99.97082186997565, 99.79486947589453, 98.85996541481617, 96.0567336058917, 99.28087429133458, 98.60540354806747, 100.6233724088689, 101.0784551550122, 102.1802442899929, 100.70231756225007, 99.38176036048384, 99.74170621262928, 101.90818385255864, 102.20566747830952, 101.03481728345506, 100.35223726903348, 99.85092117584033, 97.69545380449102, 101.27148090029823, 97.09387798838827, 99.97368720439397, 99.26884284167659, 99.77505917392868, 100.77239444320173, 102.95837430711966, 100.80245691914735, 99.11721316574123, 100.86447495591206, 96.45535021241872, 98.8614985569985, 100.68067542690224, 101.5842546945482, 101.51357578337678, 97.56296930310188, 98.99265210021713, 99.9161893286657, 100.90956257282387, 100.53716774475251, 99.10725887698234, 100.83974101995241, 99.57875874224136, 99.45029947569296, 97.57956793710116, 99.51141028566633, 100.77961480506136, 100.10006833469339, 98.84114483733222, 100.16749379051328, 103.75121984303289, 100.9400536822684, 100.3553092933137, 101.49669567933739, 99.4293361952507, 100.35516694663107, 98.81405570449732, 99.70907851704877, 99.46731028823532, 99.67274897307288, 100.34052991121186, 100.56433771430834, 99.73015640248187, 98.61898070193928, 97.23449381388248, 99.46511995698714, 100.77079999396224, 96.20982720609237, 100.39543379852341, 96.3457760272295, 95.59302099712679, 95.33941394182793, 102.95751243216105, 98.74707194798336, 98.56678945768302, 101.21911378018642, 100.50824211618003, 100.00723333624695, 100.22050784518098, 101.89232758328554, 102.83277532573601, 96.7661975570612, 96.35155615941058, 100.61036519104255, 100.92918445755208, 101.80043859541288, 101.34072659192469, 101.11047762422385, 96.16995077942262, 102.68409835513236] 
average_reward:99.91570355943591 
check_reward:[101.4911174310993, 99.52209823921851, 101.33423468197594, 101.73658741714584, 101.6103371392103, 102.55009608078295, 98.09182317135998, 101.56890904746436, 103.4030395748733, 103.28569766982892, 102.56591284843347, 102.62732130052922, 99.02496936292778, 100.71727381061312, 102.17025659631841, 102.21969799012162, 102.59045970984363, 103.49371372867625, 98.7093930861289, 102.40806292318749, 104.44901240677835, 98.81564072947864, 102.48876222383281, 99.9939257546643, 102.63139674047585, 99.69675487553087, 101.27865608928579, 103.28625788521713, 100.6357239109347, 100.95998912609858, 101.61131874281855, 100.28383178718968, 100.99945880268675, 102.77265456796788, 101.036044517428, 101.60535692485715, 99.23613510039347, 100.97837114312182, 100.75475431710146, 100.47758186838345, 102.67914557701903, 101.91002215968844, 104.05770428015681, 99.56914754134313, 97.94053708765585, 101.92258761926058, 100.00760457642252, 101.82635050737768, 103.29751764247355, 101.55496802161238, 101.65033134605137, 104.77049349869304, 102.53324690293677, 103.96297654127201, 101.72501079315737, 104.27878062834937, 102.39180073939391, 101.48554671777141, 100.68841611803401, 103.53819610055893, 100.05485477800384, 104.88746168604214, 104.37841195149021, 101.83198862200754, 101.36048990355141, 103.20810655392569, 99.22773312369038, 102.83630510283814, 98.08779805765151, 103.81033368504413, 101.39089180791501, 100.92740017772852, 102.71659293674814, 102.78777134106592, 104.47055219597843, 101.23673475835426, 101.65622660539046, 103.12150824124345, 99.11811209985993, 102.49883725443794, 98.94585503836909, 99.90559051322796, 102.23372990191604, 100.38056826500483, 103.22915173317449, 100.73163448185717, 104.20203052394221, 101.01820814906483, 101.85836674517662, 100.06778368811385, 105.1356438735394, 102.5890945532675, 102.57513605803024, 102.56619004708486, 102.3586846315381, 100.70665789797123, 101.71938924489912, 102.66130333193695, 101.3024369256301, 102.60630936122436] 
average_reward:101.7330488957115 
check_reward:[91.35888350773513, 93.38718611928405, 92.71730341857986, 91.77320941081814, 92.04646670933838, 92.91355795767583, 93.46188876755028, 90.36184949959707, 91.16318444327433, 94.00160249088171, 91.38198699351253, 91.09276328662341, 90.48974712554954, 93.28309080772696, 89.66994074485874, 93.07731701218167, 93.24290227553247, 92.20396097324596, 93.37370000447726, 91.1416540251515, 92.13316804604607, 92.27324138714265, 92.66197753545654, 89.78377107390018, 90.89107691195888, 93.03314750082869, 91.41175086246056, 89.16223827505684, 92.55371850558662, 93.47760829415999, 93.13767460804638, 91.76401817751218, 91.20086618249252, 92.65345276886345, 92.72493822082048, 92.63323112612527, 92.71077673251727, 92.64021219089473, 91.4898281090471, 91.4342958492646, 90.9472076734572, 92.2330565828895, 90.9883312280663, 91.3701679938442, 90.01871957939744, 89.41158832505334, 92.14847456010192, 91.9643644041129, 92.07457299230863, 90.84375424215065, 92.76605756410692, 92.62189036490521, 89.90328594658762, 94.28358926628894, 90.15640498763206, 91.28589459725217, 92.96204094646541, 90.28373278701959, 91.81735909315348, 92.26698333160888, 92.48381754497292, 92.12584355605176, 91.11583058136208, 93.1936908472019, 92.86324565345026, 90.62856418575117, 90.57270935112349, 92.11803332030112, 92.49684082731974, 90.40980736529231, 92.8530786716481, 93.00376471097137, 91.7765827525233, 91.99869477836583, 92.20328852251218, 93.20799969529759, 91.93033130206383, 92.86484662721051, 92.3762421435899, 92.15833476330018, 95.34251737285055, 91.32276597440267, 90.66554548698922, 90.92970699204665, 93.56534616129224, 90.75861680452034, 93.67541047089709, 93.37026115941268, 89.18275093888357, 92.98388160216729, 90.52850598887348, 90.8753471452453, 91.61279367138616, 92.29451093290135, 91.61427691821517, 92.24999867401861, 90.91880064962763, 90.83210175104207, 92.16864290832156, 92.02293879747619] 
average_reward:91.91556931999057 
check_reward:[109.0284144891349, 108.7136918244558, 108.25283726059676, 107.68097113893327, 107.59095195932869, 109.2207895507376, 110.49740283729426, 109.48741098316174, 108.53090467422751, 108.94674289302216, 109.10108676744272, 110.06024990115179, 108.5423627568542, 107.39937273576678, 110.52070395381037, 109.49822245831461, 106.23738564510467, 109.61949836871261, 108.6153017568187, 107.81196400206535, 106.3379924350956, 110.32599052839711, 107.84864794534003, 109.20549847461936, 110.71402731154791, 110.4714706841186, 108.70134097864818, 107.57631557087329, 110.65235485834731, 108.20898982850977, 109.23086566403853, 110.27414051404764, 109.32870084685123, 109.39479009283212, 108.56533017684451, 107.44240375091967, 107.46718912452071, 110.51318254577203, 108.94875244058595, 109.54507765756269, 110.75997668109495, 110.21367762914777, 108.15154025069674, 110.42270312983922, 108.65054240829676, 109.07371801580973, 108.92242951000347, 106.95713352712147, 106.66136460970537, 108.71765032947482, 106.85289290401857, 109.79386478354587, 107.61651358873561, 108.56709237865368, 106.25413169508401, 111.52635539714117, 108.10599407339609, 110.54733769057043, 110.29795792524976, 108.16388776803247, 108.90738013375417, 108.04904394244083, 109.09611077139091, 110.43929637008755, 107.85370949107734, 111.70424179824985, 107.60708867142927, 109.14479058451128, 109.20027003912264, 107.69591378956795, 106.57119514612569, 107.8192977099995, 108.67064976672657, 108.87413889161819, 107.7658568668277, 106.42083378881561, 109.51479740488047, 109.99010090469608, 109.33104581408719, 109.43333826500171, 109.21700517942364, 107.65845305946672, 107.79411782959525, 109.05196477872053, 108.4085951820793, 109.65454974019721, 108.93757017853764, 108.68913275828704, 110.17612745377524, 110.53284866709305, 108.88673356531704, 107.89563016542292, 110.63595637203821, 109.66542571225568, 109.78863832322011, 108.17204743961013, 110.8478481943111, 107.75334395017279, 107.04725824779798, 106.92238269879917] 
average_reward:108.84190821328556 
