trian_config 
gae_lambda:0.95 
 gamma:0.99 
 clip_coef:0.2 
 max_clip_coef:4 
 vf_coef:1 
 ent_coef:0.0 
 learning_rate:0.00025 
 ratio_coef:0.5 
 grad_norm:0.5 
 max_version:1000000 
 pg_loss_type:1 
 enable_clip_max:True 
 use_noise:True 
 enable_ratio_decay:False 
 enable_entropy_decay:False 
 enable_lr_decay:False 
 enable_grad_norm:False 
 enable_adv_norm:True 
 enable_mini_batch:True 
 gae_length:256 
 num_envs:16 
 num_steps:512 
 use_gpu:False 
 mini_batch_size:512 
 tensorboard_comment:gae_length_256_num_steps_512 
 check_reward:[3705.0787501540935, 3883.54278633019, 3689.4242651441896, 3023.8139226268754, 2476.649575828238, 2534.147867998522, 3636.653078007834, 3701.533613368458, 2336.837695363294, 3636.727149978114, 3693.776370182157, 3711.312355281747, 2524.6630697412274, 3659.7979810571605, 3673.340062784427, 2623.2846170477465, 3737.4764140281604, 2970.46256795474, 3879.127768539067, 3642.4518001424076, 3665.874092079369, 3666.08794443536, 3193.9584061328305, 3643.6316719232645, 3726.997190258402, 3494.17192443945, 2679.058848825088, 2419.874009966637, 2917.7388615946998, 3873.1800339095867, 2542.125798492853, 3673.92962398815, 3328.590547540174, 2632.010334717954, 3665.5700371986527, 3709.1723343716612, 2961.315540538809, 3680.7287757346603, 3691.4048708467294, 3145.90226116073, 2577.42694479866, 2600.064422022925, 3132.644754186152, 3102.4088644875424, 2451.5276937962935, 2647.7933214621216, 2693.597688976109, 2579.8483749546886, 3752.33309857827, 2810.7990294769124, 3574.314419768053, 3583.8763712882355, 3666.0996386632196, 3659.3270456127, 3637.9209481828275, 2576.392472536943, 3709.995372092034, 2751.802287167645, 3548.593464125206, 3851.595409592303, 3680.0846035899585, 2627.781622719883, 3643.6356254070656, 2947.2985560437437, 3287.466967875748, 3457.5822490025967, 2676.2987052356057, 3848.3072748284035, 3176.001207967566, 3634.236669526457, 3043.6930262615697, 3291.2385676800313, 3338.5284894276747, 3544.2874392641256, 3627.8521997949874, 3668.3701777127817, 3334.9311176932815, 3729.8215155306343, 2780.742471770449, 2937.5419961311627, 3619.511608053357, 3269.7775154899073, 3871.945899701418, 3664.961658058787, 3576.6004271606175, 3152.2250522893946, 3670.3129424220188, 2939.825471743704, 3328.1709793614564, 2086.9429511111844, 2902.9720152538057, 3720.3934254189153, 3371.26040658686, 2790.6793676869083, 2897.244479390991, 3806.303479584267, 3688.132303753587, 3649.023936566259, 3651.5401000439424, 3265.354350705616] 
average_reward:3291.5866529532923 
check_reward:[3423.3903029607627, 1023.8411593475439, 3437.728446394648, 3418.1885473261373, 3438.7735680259902, 3426.7433840302883, 3429.536448152132, 3422.6342743974196, 3425.1679828190386, 3399.90923429437, 3400.3406558886372, 3420.233488343007, 3448.3292569206405, 3437.9421418468, 3452.0410935404925, 3431.79562875547, 3429.6387053326725, 558.8103979612277, 3408.9130921696515, 3430.4652790552877, 3410.0379550910648, 3440.7841062934363, 3452.8095361453024, 3441.0363643879246, 3450.694111565164, 3441.597609517189, 3411.2327690252027, 3430.0263579871216, 3422.0575465976603, 3443.724808289494, 3449.0214098406577, 3426.0169886101703, 3419.8826677141988, 3434.099123922887, 3417.384145209372, 3416.2659397129873, 3405.4504624534256, 3426.8718342237325, 3433.5479789164715, 3422.8795166806285, 3454.2205807689784, 3412.2485297401167, 3401.4293694440166, 3418.9723970892305, 3443.5494970926757, 3444.2809175137336, 3443.4151272480904, 3415.576482016173, 3390.686510963843, 3427.1753136445454, 856.7034868404328, 3434.801053804088, 3420.0377243832195, 3435.896102690399, 3453.035117055235, 3426.090859477227, 3418.960918677467, 3420.689785093714, 3415.1252247856028, 3451.2616005551354, 3409.949541456045, 1229.9044701960236, 3410.703710159058, 3435.2477264126114, 3409.622100870491, 3442.548112774488, 3417.59040044937, 3428.69881813142, 3426.9371770083553, 3423.742871824612, 3429.0039859543263, 3402.048549793002, 3428.8190706480304, 3429.647495540323, 3441.3638109701287, 3442.127824060609, 3439.9676226015017, 3462.2468120363637, 3414.7382535838206, 980.8974868615375, 3419.027526467629, 3423.019676656512, 3425.170493064792, 3419.0325206536127, 3439.0077199436478, 3435.303115501131, 3397.677096297798, 3449.1935766928777, 3432.523508216342, 3438.502645853036, 3419.389878451452, 3423.447941165901, 1349.098240622393, 848.9522798695447, 3430.7568878810107, 3404.9022971244644, 3428.4290643567097, 3418.419760749418, 3430.0531767296397, 3420.0809659356396] 
average_reward:3256.017951321959 
check_reward:[3727.0931329036293, 3698.8051884251795, 3699.7496367245194, 3699.4203823513453, 915.2590221385358, 3721.8167928135153, 3682.0859453871326, 1586.7548913296882, 3712.6581405450415, 3723.1080577210073, 533.6515843973974, 3676.7140771514682, 3680.194786046952, 3700.7545229142975, 3684.733874376544, 774.0959260181539, 3691.917113288958, 3735.382435702735, 3723.889998398064, 491.10945549752046, 3698.9813807172077, 3674.4118528608305, 3720.8718037700537, 3716.0803897963515, 3739.555841102982, 766.028423848373, 3692.299134013334, 3693.2196761640457, 3691.7481634030028, 459.06985286663496, 3709.5976769594986, 3681.0668347574456, 3667.9059147719668, 3696.566681087311, 811.6076647229736, 3711.7552895651797, 3707.061645220938, 3705.7387231085086, 3686.8944159923667, 3741.584979109957, 3683.026851115384, 3701.682025244857, 3695.7367167782177, 3683.350179624365, 3662.32729909404, 3712.9811938151774, 718.4631297481955, 3728.3938236227, 3727.904715905593, 3732.6383703761076, 3724.3283484240983, 603.4911839193046, 3707.4097159772773, 561.4394007330825, 3725.15798386575, 683.807738829829, 3696.735201448982, 3720.7664018822184, 3724.7914670244118, 3707.4166077781897, 3655.8853379922175, 3705.9858366312073, 3706.7718883592506, 3685.518319558566, 3694.4283573431394, 3720.0739620773857, 3727.8571361253053, 3706.7636924452445, 827.848381341321, 3701.8870570360286, 3726.2209575806337, 3701.480384316904, 3692.0694410130905, 533.7381897693526, 3716.519369679021, 3702.0344457983874, 3730.271243835536, 3722.1600668103747, 862.5662495467632, 3714.78096252694, 3721.1508545328084, 784.6598249729087, 3736.3106251672807, 3688.685593590419, 3684.6819538581067, 3677.8803281617866, 979.4579847776845, 3716.1630363110726, 3671.808764804225, 923.2375932283044, 3713.9631606498942, 441.444548233578, 3701.2008220831694, 3689.8733514540736, 3701.058776112779, 3695.9611076883357, 3701.156830466395, 1108.949779286152, 3716.9641291905955, 3681.3467802206324] 
average_reward:3117.039067877553 
check_reward:[3367.9338231595257, 3361.5305952293597, 3356.9008893104183, 3327.435973884021, 3333.2925257089614, 3371.055834155353, 3358.2104166894487, 3359.5112408541954, 3382.037932069712, 3320.0645441858164, 3361.2781844221518, 3353.2771285618887, 3355.4183183053265, 3368.7793757111804, 3367.057689018229, 3331.4890221746286, 3367.7402179052633, 3355.5440322385984, 3361.027143066817, 3377.169863533705, 3370.479769297937, 3356.8192747582816, 3325.1464864580066, 3336.696289156267, 3384.832863388108, 3366.327807693575, 3356.517964414525, 3353.659740190973, 3358.6026388262953, 3354.322286331778, 3354.06073197364, 3351.092265358091, 3352.1713891444624, 3375.425072177788, 3353.9108186332664, 3370.187750818028, 3358.00830768011, 3361.818469068103, 3371.195329792421, 3376.488451442937, 3355.2498678628085, 3358.5680501166426, 3368.4373359534447, 3362.001428876059, 3363.6530402809612, 3367.260526622362, 3361.9961093317643, 3359.340098481907, 3371.526189637222, 3354.506915169006, 3357.970003236601, 3368.17423511462, 3355.085261623322, 3360.6896249999745, 3356.9896379688953, 3364.5544174170664, 3370.5865194005437, 3357.391670724857, 3356.870507073879, 3362.47449609446, 3362.486710136785, 3321.2565730043407, 3383.5391661756103, 3357.8780965747, 3362.728377118027, 3355.3663358244394, 3369.108067354511, 3367.8329512483974, 3375.3172344917452, 3355.202546971088, 3371.674767858322, 3353.695541640919, 3361.827613373946, 3351.812017260271, 3363.305769397415, 3358.790238143297, 3376.665121345098, 3360.0608915577277, 3354.1383453710096, 3366.6712118129385, 3313.8978687921485, 3351.312810409583, 3361.3998096463547, 3374.2509704353406, 3356.7998707118268, 3319.265921557755, 3359.7037755282026, 3367.6893423508745, 3357.9837108822794, 3349.057655184101, 3357.043351212205, 3351.813788643338, 3360.9242691282043, 3367.182940699663, 3377.840533700055, 3364.4560890997036, 3365.6349440049844, 3352.3295744622255, 3358.3454427275656, 3356.4511656781515] 
average_reward:3359.1058580429067 
check_reward:[3432.7120208994456, 3441.2224836983905, 3437.949730678052, 3435.836971597724, 3437.5354134530626, 3439.9392311509737, 3439.3817856826327, 3408.3041441686937, 3441.4993720580205, 3433.6870672214554, 3404.519593610442, 3436.583455194716, 3408.462679965646, 3439.456048341758, 3432.3838820534534, 3432.702160682633, 3445.1803696155844, 3417.871109763178, 3422.592130302877, 3410.915622423132, 3429.0541031357725, 3437.9879006313736, 3427.9819734045395, 3416.335296677499, 3426.215699419271, 3417.6715259124126, 3421.1199739837725, 3430.7547790981203, 3430.1134411977855, 3438.3093826056156, 3428.689187424514, 3430.913173839382, 3411.6134752602425, 3412.5806762961765, 3428.8729206156477, 3443.5508947790377, 3435.9562079879433, 3437.262636819454, 3430.827458147317, 3441.0493787253467, 3433.6323602544853, 3435.5989011711513, 3441.0344815359595, 3411.766722100618, 3431.772597811414, 3444.5209848200802, 3431.4270814784504, 3418.7675484872216, 3409.4107847869673, 3410.8619525125164, 3409.3975580945903, 3428.2440554770014, 3440.6868247212806, 3429.4099476280717, 3438.758313147198, 3437.0857129031074, 3437.512875524255, 3407.5593977666636, 3441.432923800453, 3443.9618481000252, 3415.3679275420827, 3416.5053325020986, 3410.4937903146088, 3433.3668063953082, 3425.6749888581508, 3431.4873445079284, 3413.3491360344715, 3413.2581502348903, 3406.0877372430323, 3437.4508636261753, 3421.52465933877, 3437.262043759073, 3429.5861879222957, 3429.3975526723925, 3438.0959162988856, 3429.0762295691884, 3407.0692673783233, 3434.005913175339, 3431.6466111469344, 3427.9505542468137, 3431.458436525175, 3413.254089383412, 3425.771385400343, 3440.394109780401, 3423.678146490554, 3432.2323823314086, 3411.22788663935, 3426.2480853381885, 3427.2003166941936, 3431.7780713199454, 3439.410638800565, 3412.016435917891, 3430.3499501798015, 3431.514962861295, 3430.74599859093, 3440.4012850985973, 3445.3541583673605, 3428.934714963214, 3415.219240283398, 3424.224971364245] 
average_reward:3428.0851050974165 
