trian_config 
gae_lambda:0.95 
 gamma:0.99 
 clip_coef:0.2 
 max_clip_coef:4 
 vf_coef:1 
 ent_coef:0.0 
 learning_rate:0.00025 
 ratio_coef:0.5 
 grad_norm:0.5 
 max_version:1000000 
 pg_loss_type:1 
 enable_clip_max:True 
 use_noise:True 
 enable_ratio_decay:False 
 enable_entropy_decay:False 
 enable_lr_decay:False 
 enable_grad_norm:False 
 enable_adv_norm:True 
 enable_mini_batch:True 
 gae_length:256 
 num_envs:16 
 num_steps:512 
 use_gpu:False 
 mini_batch_size:512 
 tensorboard_comment:gae_length_256_num_steps_512 
 check_reward:[3375.4672448892616, 6296.710785061448, 6213.800168981785, 3355.9974067030685, 6512.6922087704625, 6216.373713349479, 6480.248295543326, 6264.709319777297, 6341.12810669939, 6417.8690280027095, 4350.47783076116, 6530.197588233107, 6211.908026780711, 6476.082344602433, 6303.492751718492, 6252.276880973772, 6339.579124341667, 6213.507351845015, 6232.155798967586, 2884.6483363839934, 6323.523751408855, 6434.056726206224, 3891.1513195507487, 6348.732155841348, 6309.120806249849, 6428.1517162929, 6476.508324897433, 6305.125605734116, 6348.5514911737655, 6294.962628079596, 6355.929218866214, 2821.0232302722807, 6368.520911449486, 6373.004545714553, 6149.251789985372, 5476.80664305093, 6259.820392125138, 6375.763150075623, 6249.050937909999, 6396.764075380997, 6169.530820184837, 6382.930524392654, 6272.005310076421, 6390.36708977623, 6554.363985072005, 6495.199216348111, 6248.67153014579, 6380.50153891582, 6303.866250531774, 6207.526712565368, 6323.939645403945, 6437.449178826731, 6330.993467128392, 6408.023130266343, 6402.658219920882, 6434.906743040078, 6379.01662788853, 6554.722338435415, 6329.881859484141, 6435.49211932323, 6200.9995725479, 6289.115086789559, 6432.852272852767, 6649.267620888719, 6423.656695744476, 6209.514889812577, 6586.6321358148125, 6281.4972030706695, 4894.503597610553, 6041.0203630001715, 6345.139121959155, 6390.250654146486, 4448.696603247392, 6429.490417829915, 5550.324182983781, 6312.10394109586, 6310.472545550194, 6144.578601463865, 6309.964759854659, 6380.021834946963, 6226.456517161617, 6295.366912191016, 6442.92271601201, 6290.261498744512, 4327.980696384813, 1863.389734288241, 6297.887885544332, 6321.376458593993, 6120.695888133683, 6290.007891213592, 3956.041203965122, 6191.897473641426, 6420.366102558186, 6388.471253389701, 5455.150980812806, 6234.373349699217, 1274.4542824109012, 6410.101695677308, 3435.434295910358, 6484.271437718879] 
average_reward:5940.541984156405 
check_reward:[4328.993408976002, 4272.627440202665, 4105.81321509119, 4266.386229316889, 3912.6403195053617, 4069.6851712605326, 4056.8927059965595, 4013.6408886650556, 3925.4898886514393, 4286.497311284651, 3587.59867248923, 4110.652887516506, 4041.3737689601057, 4012.4769058278175, 4222.243041172107, 4059.877146745504, 4118.561787330339, 4220.279179445968, 4425.109027954775, 3994.568000347048, 4348.542447737043, 4279.742657786938, 4329.356535325648, 4465.887547934584, 1203.878191886746, 3892.3372527305314, 442.8860374265374, 4278.03111051539, 4449.771295922059, 4260.636289904669, 4140.36480540151, 4425.83698363013, 4286.292988886607, 4248.441867511205, 3972.8763884966756, 4210.1949611020445, 4356.631198499819, 3809.1289898125337, 3972.0707667934794, 4014.0209056802746, 4051.3366584817477, 4226.310618084555, 4008.4586395336155, 4073.729971861273, 3797.7339442451375, 3921.2808391381323, 3796.375838969939, 4036.9200971128166, 4057.369620523745, 3938.3207234331708, 3940.835874041304, 4025.1814216301846, 4048.0132864509487, 4084.286517830532, 3995.939415101928, 4116.873973121623, 4270.455787871097, 4334.786217654126, 4391.8545478749, 4069.2856785091653, 3550.76628537339, 4242.2325471003205, 3780.0432757884537, 3898.3870779847916, 4413.387743503241, 4310.756470472177, 2935.9684953582196, 4128.487474797614, 4224.815178110797, 4389.558051458085, 3966.6279950343082, 4206.020470575637, 3263.053456720291, 4072.00523198828, 4055.0004070422633, 4025.7209369088323, 4353.103184304625, 4480.851875264478, 4227.5724272164825, 3568.50093563589, 4059.0234297202005, 4198.224742440041, 4255.2088459011065, 3137.397770268334, 4164.511361251414, 3110.8363115245766, 4312.391526396512, 4079.333891174575, 3999.911915042409, 3944.4890298075607, 4184.753414105135, 4223.061616896472, 4240.431442396158, 3869.0093301838215, 4039.4489429364103, 3981.1192318242765, 4057.1808108094556, 3255.557585442185, 4245.437734617174, 4105.9742271924915] 
average_reward:4001.5984857176254 
check_reward:[4965.813210173651, 5015.300936039206, 5153.919117750949, 5113.699724081993, 5071.002193532324, 5092.869066514452, 5112.240852401765, 5158.537869873965, 5259.913397428487, 5219.24630317296, 5168.643852343317, 5172.857671230657, 5103.878754519894, 5071.99166498994, 5253.935558495589, 5107.73992242673, 5265.08468763466, 5120.632265528669, 5081.361820709291, 5056.170075665114, 5089.734558252784, 5108.417583907791, 5238.157945916412, 5161.820409767355, 5075.239905156461, 5173.420600679528, 5055.900754621318, 5070.328952122214, 5122.053874264528, 4991.403846472525, 5009.181778522456, 5095.094306654981, 5085.980787126413, 5195.652043082317, 5103.169890566525, 5144.086985571872, 5036.709728074724, 5195.645743188639, 5182.031096059625, 5225.8150554293825, 5063.401928959846, 5142.7886186342, 5171.629271449976, 5178.25387945096, 4965.843353740987, 5096.11092250961, 5176.0885872941135, 5406.326940302175, 5169.916661737565, 5236.17725576028, 5051.537333699283, 5104.855908896589, 5110.876836638061, 5068.3967246183, 5112.816920284258, 4837.191504833232, 5203.554394872793, 5227.909954857772, 4982.111910660959, 5107.0969216000885, 5113.595369442249, 5030.777852674556, 5205.558282256994, 5060.128150946302, 5125.886256918824, 5038.753341404368, 5323.761522026807, 5081.216687497541, 5231.801214046765, 5193.708764877163, 5015.750521516267, 5190.016950207393, 4965.280609612358, 5066.082108488959, 5079.884999897048, 5028.53507485202, 4941.775237161217, 5091.05296505265, 5220.290293309178, 4956.018508900426, 5129.264101214386, 5030.442978465783, 4814.332338831574, 5277.979316385818, 5040.991530353517, 4995.506362307302, 5196.744989640927, 5055.872924706, 5103.338477028763, 5196.643546372488, 5259.521548817874, 5138.185698892959, 5168.803739973031, 5141.636975515035, 4935.329711419159, 5079.205689209901, 5004.934690136572, 5097.619645886025, 5128.712999831965, 5196.322927351273] 
average_reward:5112.888355241819 
check_reward:[6204.2754827814915, 6117.188079034036, 6013.085789758588, 4781.794696152629, 6032.041865090199, 6183.453668055034, 6264.75506410214, 6193.995426284002, 6249.551224951699, 6103.652881199264, 6102.129421103794, 6214.199641100511, 6121.930962959276, 6118.33762664301, 6209.172512197894, 6155.575920945498, 6317.673080069078, 6187.1521160289885, 6236.947585778831, 6318.337793099126, 6089.308038805634, 6261.94155562444, 6226.012784180968, 6113.868868647383, 6215.382535535561, 6269.111118443567, 6278.582116872647, 6124.514845672413, 6254.248088970277, 6218.045358232099, 6192.442407476408, 6308.320124222085, 6087.187381803093, 6168.495257115437, 6185.089578061252, 6216.617912019328, 6230.052416558348, 6177.341549611438, 6170.111525783487, 6134.067604809682, 6170.395164622083, 6201.741406883504, 6198.006622804244, 6121.036766027781, 6237.404586765464, 6173.810542622531, 6118.910600655757, 6123.047396730313, 5792.680816432025, 6131.604864578648, 6408.623269966651, 6181.4525073868, 6126.942051053888, 6131.4586716978465, 6263.740536827924, 6258.014422055251, 6233.319314012044, 6142.146089720809, 6198.0467299130705, 5986.875813139615, 6311.81760977934, 6188.313526556323, 6004.621743695943, 6089.921314057216, 6231.3448234494135, 6297.991576777451, 6198.750693280946, 6231.402348206277, 6137.711936527252, 6219.432495611627, 6320.943066955653, 6225.4243551089385, 6174.80971399141, 6260.5945396297, 6304.46222237879, 6184.724259523967, 6077.925320521514, 5068.75899891136, 6245.195815268758, 6278.168334484199, 6220.2950870543955, 5787.364647099265, 6069.536357862614, 6188.575014085004, 6268.131505070058, 6073.130987399999, 6180.670869251239, 6208.645070655599, 6158.435525197025, 6258.486577216994, 6144.067138712951, 6228.632249851265, 6296.234498673737, 6164.467858331056, 6178.435045897009, 6015.639136763762, 6264.611222000138, 6187.950863520937, 6193.518634927541, 6245.7327619122325] 
average_reward:6156.301258258759 
check_reward:[6771.379998968527, 6125.387565224929, 6651.02824992332, 6599.991738863736, 6509.9686949430425, 7106.981603724933, 6593.0401519366305, 5990.959672358511, 3427.3437572581074, 6735.759355069478, 6620.736493711016, 6683.850102029612, 6660.511172722688, 6689.09855943017, 6970.664516024099, 6587.0346888901795, 4175.396444627463, 6399.30441781331, 6856.757499626241, 6854.666566313914, 6630.84549740641, 6456.866421812749, 6640.980522611611, 6739.4294027100495, 6809.52933727701, 7010.911050616481, 6719.3276285109105, 6730.168988146516, 5704.14321616968, 6446.317920821793, 6674.6493560682065, 6599.028321184534, 6820.771016693946, 6593.547940041185, 6654.45724391514, 6604.457754739732, 1714.846426762896, 6253.285785515545, 4770.442951569484, 2253.659669900188, 6629.563199167853, 6786.0135743564715, 6235.1432528091245, 6623.698085886937, 6578.101546120773, 6793.77219016086, 6921.086026255325, 6866.840372125002, 6483.3051629901065, 6971.138554090597, 6487.277689451477, 6862.061705800217, 6928.524882674667, 6438.812603337157, 6865.029331703644, 6629.903122497921, 6829.4384833484, 6996.850692297955, 6623.008062451663, 7020.830703946642, 480.2529497933539, 6813.681091240729, 6707.407982060559, 6690.227576378369, 6745.5747690494945, 6444.35027239567, 6327.073880070646, 6816.458266669239, 6341.255577288234, 6687.118648890674, 6566.627821927041, 6364.1263322613395, 6933.8069607984235, 6651.75439322903, 6724.326288551991, 6266.59265967618, 6507.84079808869, 6792.579870477494, 6706.530082983383, 2261.6043455889276, 3347.1895063871407, 6593.34561755464, 6418.672116530557, 6794.146582301946, 6674.517916990878, 6784.957671632191, 6616.056924756271, 6759.65140667205, 6517.073588935517, 6689.5962399863965, 6655.820084363257, 6748.546820693698, 6880.86094327342, 6774.118065881132, 6960.018697633872, 6935.350691269252, 6487.137476612942, 6888.731187721858, 6945.341349119559, 6659.92703251563] 
average_reward:6353.681774316584 
