---
# Run configuration. The directory names below suggest a PPO agent on a
# static 1-D task; the script that loads this file is not visible from here.

# Plan selector: 0 = sin, 1 = Gaussian, 2 = step.
plan_type: 0

# Presumably seeds the random number generators - confirm against the loader.
Random_seed: 1

# Presumably where trained models and training logs are written (paths are
# relative) - confirm against the loader.
model_dir: './model_dir_PPO_1d_static'
log_dir: './log_dir_PPO_1d_static'

# The remaining key names match constructor arguments of Stable Baselines'
# PPO2; presumably they are forwarded unchanged - verify against the caller.
# NOTE(review): if so, n_envs * n_steps has to be a multiple of nminibatches.
gamma: 0.99
n_steps: 100000
ent_coef: 0.01
learning_rate: 0.00025
vf_coef: 0.5
cliprange: 0.1
nminibatches: 100
noptepochs: 4