---
# Run settings, read as a single flat mapping.
# NOTE(review): the per-key notes below are inferred from key names and
# values only; confirm them against the code that loads this file.

# Presumably the multiprocessing start method -- TODO confirm.
start_method: 'spawn'

# Output locations, both under ./history_PPO_LNet_decision.
model_dir: './history_PPO_LNet_decision/models'
log_dir: './history_PPO_LNet_decision/logs'

# .pth files under ../model_weights (presumably pretrained weights).
# The paths are relative; what they resolve against depends on the loader
# -- TODO confirm.
pick_path: '../model_weights/pickuncert_best_succeed_rate.pth'
drop_path: '../model_weights/dropuncert_best_succeed_rate.pth'
lnet_path: '../model_weights/model_rnn_globalpos_globalvar_varout.pth'

# Presumably the network input width -- verify against the model code.
input_size: 25

# Run sizing: worker count, episode budget, and test cadence.
# NOTE(review): units are assumed from the key names (episodes, steps,
# environments) -- confirm with the consumer.
num_processes: 10
n_episodes: 10000
test_period_episode: 50
step_per_trajectory: 1000
num_envs_per_test: 10

# Optimisation settings.
lr: 0.0001  # presumably the optimiser learning rate
discount: 0.99  # presumably the reward discount factor
batch_size: 200