trian_config 
gae_lambda:0.95 
 gamma:0.99 
 clip_coef:0.2 
 max_clip_coef:4 
 vf_coef:1 
 ent_coef:0.0 
 learning_rate:0.00025 
 ratio_coef:0.5 
 grad_norm:0.5 
 max_version:1000000 
 pg_loss_type:1 
 enable_clip_max:True 
 use_noise:True 
 enable_ratio_decay:False 
 enable_entropy_decay:False 
 enable_lr_decay:False 
 enable_grad_norm:False 
 enable_adv_norm:True 
 enable_mini_batch:True 
 gae_length:256 
 num_envs:16 
 num_steps:512 
 use_gpu:False 
 mini_batch_size:512 
 tensorboard_comment:gae_length_256_num_steps_512 
 check_reward:[5354.083923955214, 1907.3858499264447, 5071.572412493682, 3818.179153031112, 5235.813088421573, 5089.430514563135, 5172.546960083919, 4895.540338757957, 4001.3997661974527, 5083.046533495249, 5101.412643641336, 5204.801340773778, 5010.133704456472, 3806.3168011248335, 4784.3080769910885, 4646.269258173723, 4577.730852678579, 3602.78094972793, 3979.831428360593, 4866.068777779006, 5186.3108391857695, 5260.004607851326, 5008.449440243754, 2780.70206095043, 5286.531284991926, 5220.2283623388375, 4971.079941337859, 5238.565392466404, 4911.846235162078, 5111.631139358593, 5155.704015176254, 5215.927859705058, 5220.303497145274, 4910.879168375321, 5177.877598124833, 5199.70812945311, 5119.36025172477, 5006.655021108073, 5139.006415056033, 4980.801985977811, 5226.271543301059, 4341.457295792847, 5116.139193720124, 5176.04236203066, 4958.861274786426, 1957.9567287313607, 4773.299196332585, 5277.262695580678, 4962.034354981737, 4835.894166576929, 3405.519834571072, 5190.914152326921, 4923.671502386225, 4809.669924911503, 4918.706861002523, 5097.769829518304, 5363.988919006349, 4349.812801967839, 5101.7307769686195, 5147.647262318968, 5236.426970338679, 3423.0981468523114, 5126.627606790728, 5004.2049938244145, 5060.883545720299, 4999.7950138159395, 3231.864332697531, 5094.870087395075, 5044.151685393852, 4825.874347315484, 5144.456015954313, 4464.788899796512, 4779.858555400612, 5037.4518854391345, 4971.2895222208845, 5004.680112436714, 5193.850927468668, 5158.00577439299, 5023.8266521047735, 3108.2959638185157, 5126.995706370239, 1320.1710304444985, 5144.331296006782, 5063.622192961679, 1431.3866326017326, 1214.6540952356925, 5073.263269508303, 1859.236714130526, 4778.56919979878, 5071.3616291313065, 5105.65994290114, 5121.452796607455, 4797.515557425808, 5266.180669421302, 3946.842651810516, 5101.691221384258, 5262.826928222837, 5129.7998508753835, 5157.483839042929, 5308.92789931858] 
average_reward:4674.611504595565 
check_reward:[4902.671671076021, 4933.720775289439, 4937.279231004383, 4940.719923205226, 4885.2576283221, 4923.813758824288, 4937.894547878881, 4879.9330127282265, 4894.730430024076, 4908.672172652068, 4910.382953532657, 4957.099654436999, 4931.091045735709, 4920.123443744099, 4956.983995204166, 4902.063057533176, 4915.990474421427, 4880.740610232802, 4867.329163734874, 4880.243376590071, 4915.435836372146, 4958.48640998271, 4897.807406287073, 4990.154801554011, 4897.543054156465, 4938.124564723308, 4898.445618569302, 4913.602225732172, 4918.393010826159, 4857.967414272278, 4890.762479098379, 4965.169023043658, 4901.919574016911, 4935.925917093729, 4935.396651575212, 4911.9353005171215, 4909.0434193436195, 4889.231035767445, 4973.137953985962, 4917.944777535056, 4857.32711337568, 4948.016668110076, 4869.371321455916, 4965.4533377529115, 4897.656725423578, 4879.67668711273, 5001.15060556835, 4922.703191044207, 4935.533785377585, 4885.955597207987, 4937.9571042704565, 4917.903302449534, 4914.135584748893, 4880.265591195626, 4940.661290691693, 4962.092595501817, 4911.200829010427, 4846.906633285212, 4910.3004336569265, 4882.795937150198, 4925.569486978877, 4899.324817421959, 4931.799342682927, 4949.63093255913, 4925.546225910788, 4939.884184102836, 4954.949217920374, 4916.2377240241985, 4882.48652156655, 4907.509274443017, 4920.713083450326, 4908.317437242886, 4945.75190623058, 4932.5679648504665, 4926.873201879994, 4946.164383351732, 4983.318525140625, 4924.950186061686, 4892.341435906148, 4891.150568653025, 4870.369524831347, 4939.357845456089, 4902.609233705522, 4896.283893359103, 4878.848892800559, 4903.153110981287, 4870.925335458482, 4954.518858803938, 4905.098626124047, 4897.576247618317, 4905.527813578128, 4900.185010585452, 4834.589371094167, 4883.632280618982, 4849.512126794325, 4958.569481504574, 4902.31976109407, 4930.629503119069, 4933.162207730022, 4935.8969209717125] 
average_reward:4915.080842016205 
check_reward:[122.9006281721865, 3721.4948117952454, 2798.860343379918, 3615.0714357442967, 1913.4256353014925, 3517.7881613826803, 2227.8425097291265, 121.96021508825167, 1941.7425044655492, 3667.577494592516, 3351.1754107996803, 2423.40216855232, 3586.77529358786, 3728.8055967561218, 2745.3783549135283, 1967.9094448762094, 3621.006680086015, 3543.0160005592106, 1653.6922015425007, 1616.5313253880604, 3475.733485528136, 3387.346196738843, 3383.801236377023, 3516.288361760242, 3551.7968047748527, 3580.3896939998776, 3581.3828466174773, 1779.0844909757384, 3688.426755968462, 3600.9412278918326, 2609.01462924601, 2649.82016069748, 3693.676756021223, 3479.213144188779, 3300.4528380324696, 3569.6349104049727, 3593.5409200696695, 3631.2708103630334, 3507.982589286974, 1862.1561338784, 3694.39581270315, 3304.3155202626067, 3411.5360181972533, 2938.8530528401693, 3595.671323248169, 1355.9861286282544, 3274.4937605197933, 3369.1058205067216, 3484.000056272558, 3486.6633110491985, 3819.0471058065677, 3789.973190590889, 3566.573132663948, 3794.77339516748, 98.77304267640747, 1657.0907269020536, 118.65618533129869, 3511.9292680138255, 3389.9371226423546, 3510.4730800514917, 3550.23016096345, 3544.273615735029, 2053.3913317202373, 3606.495133608216, 2201.0171196288493, 3583.12917370945, 2760.253238567969, 3621.417594587142, 3107.2780348904844, 2963.007658358, 3699.7772746737796, 2863.008573820912, 3538.1910160000853, 2487.3373379679974, 3619.3387709773256, 1927.7872831917384, 123.99365237198364, 3529.4336310484196, 1556.4346928323894, 2986.223571430262, 3499.6233134398785, 1701.0605214754437, 3415.1068529430113, 2275.9666687346453, 3284.600134848588, 3438.4324150621874, 3530.858616581744, 3492.128952364897, 3561.160741902368, 3640.9970194471575, 3631.4758007685923, 2602.3721461917457, 3419.9598877385206, 2874.7858052384136, 3513.2542664992498, 3672.0256996483527, 3702.963085476362, 3632.5263460313627, 3753.0772385340724, 3727.114841878732] 
average_reward:3001.9206648449745 
check_reward:[3574.3756596270678, 3714.8083929045624, 2394.463528672417, 3659.931736366731, 3751.3945032067513, 3813.9521882697177, 3512.8641164811424, 3649.9278171670358, 1981.7781478679233, 3755.2013150934213, 2554.0364138016284, 3688.9188964544564, 3420.7399809938147, 1634.6371222738899, 3421.3991216946897, 3712.4852106806675, 3742.459445898593, 3504.7050139922144, 3727.31993759914, 1987.5879351822562, 3833.903707526846, 3492.735679746829, 3631.186205978388, 3539.0849353084877, 3599.8582951476983, 3488.1453237893893, 3553.680821310202, 3638.6627079794107, 3509.1392882399996, 3548.7229879443084, 3580.9725396140734, 3502.8148678781545, 3727.1090309113956, 3645.817574202139, 3638.408497673212, 3356.425032174209, 3672.633227772356, 2020.2572931916045, 3423.8719152182875, 3252.837966302365, 3731.497253061013, 3532.2158217856595, 2730.4349803402474, 3655.099523312824, 3544.766033181348, 3795.799193044872, 3030.312670522508, 3636.9007406906844, 3713.608497557502, 3280.757397737888, 3306.089250899582, 3754.7926125159456, 3538.8407228125943, 3513.813420866657, 3743.860311825332, 3683.833964394144, 3729.830079208454, 3593.1228198596045, 2573.7499898777673, 3651.644632997256, 3620.3836747071223, 3614.6208123984443, 3839.305869309741, 3859.3271432890347, 3664.0167615547616, 1470.5513949994997, 3689.731030631241, 3736.852857915869, 2800.5367640651084, 3618.353904100045, 3444.3405175950975, 938.9289381492395, 3761.3765839258303, 3473.4789774354103, 3750.8158591534943, 3757.9795249925473, 3836.6819339322647, 3170.7757733815406, 3738.2080405361226, 3711.1488134882716, 3628.310975200401, 2806.3962138830293, 3558.7529194219624, 3291.5208448039402, 3708.104352213825, 2728.539344052945, 3653.4914424672675, 3680.0722433978945, 3712.7302094085817, 3648.6868520959874, 3649.751511819896, 3687.5420239176256, 3490.077885440946, 3452.3340467136204, 3662.5392999117316, 2625.6387974074064, 3780.5070436578694, 2950.369856270315, 2387.5121713279, 3744.592933883372] 
average_reward:3399.4511044148658 
check_reward:[4482.029887220316, 4505.204731333792, 4476.148223290889, 4514.274618802204, 4464.760208046147, 4360.997730063229, 4510.290615163101, 4474.4705901324705, 4508.109811027184, 4457.770450525799, 4346.8780528222205, 4576.488549589252, 4402.45898461725, 4482.869349874994, 4458.437279136204, 2970.819194609073, 4416.049291218167, 4456.684334673826, 4530.284157326833, 4448.81601693827, 4420.000354633038, 4503.012181098673, 4470.731646455701, 4385.051767364688, 4476.898917161974, 4393.63811675438, 4484.49771015783, 4441.262985301068, 4443.59058717709, 4459.170644576872, 4476.755226312222, 4491.160464977625, 4509.709634539845, 4461.05760115569, 4474.085787312777, 4466.526983771441, 4516.386057282689, 4500.448831276978, 4497.817754435726, 4512.188674063133, 4499.163001445049, 4491.830206138644, 4483.953178340642, 4372.432945441953, 4512.558879303769, 4434.657958381027, 4516.347504080914, 4513.13024416753, 4499.862284357263, 4467.835487412698, 4461.060411551141, 4352.218314152153, 4448.491601074545, 4403.754889492452, 4500.6252149126985, 4457.778625056351, 4424.356717259134, 4492.905555669049, 4424.42414010757, 4445.678248310428, 4454.790332418315, 4519.691284003924, 4416.554300324623, 4475.60302818901, 4464.5271888047, 4383.511056164453, 4430.915724591774, 4524.502323578595, 4416.879715520223, 4481.24160704054, 4404.736334381128, 4466.431454911513, 4496.210363854895, 4467.882212109061, 4444.123066396942, 4501.70446183668, 4449.677154834655, 4425.222971540668, 4466.4180993957125, 4462.0737377251335, 4512.446605765437, 4519.457347717633, 4326.609081030365, 4470.860695797112, 4473.542721346076, 4448.791315328483, 4407.132982437202, 4535.062333406526, 4382.589130053722, 4538.147554793729, 4501.289423737735, 4486.988126408971, 4449.090685287786, 4506.647428119627, 4477.406720942015, 4377.098285601964, 4559.524174795948, 4464.58772249284, 4456.985850775378, 4505.17086244329] 
average_reward:4449.8302487478 
