# Hyperparameters for a training run using the algorithm named in `algo`.
# NOTE(review): the per-key notes below are inferred from the key names;
# the consuming script is not visible here -- confirm before relying on them.

# Written as a plain integer on purpose. The previous spelling `5e7` has no
# decimal point and no sign on the exponent, so YAML 1.1 loaders (PyYAML)
# resolve it as the string "5e7", while YAML 1.2 loaders resolve it as the
# float 50000000.0. A plain integer is read identically by every loader.
total_timesteps: 50000000
# presumably a checkpoint interval; unit (steps vs. updates) -- TODO confirm
save_freq: 1000
algo: ppo
# presumably the minibatch size used during each optimisation epoch
batch_size: 256
# presumably the entropy-bonus coefficient of the loss -- TODO confirm
ent_coef: 0.01
# presumably the number of optimisation passes over each collected rollout
n_epochs: 4
# presumably the rollout length collected before each update -- TODO confirm
n_steps: 128
# Learning rate. This spelling (decimal point + signed exponent) resolves as
# a float under both YAML 1.1 and YAML 1.2, so it is left as-is.
lr: 2.5e-4