---
# Hyperparameter overrides for a single run.
# NOTE(review): every description below is inferred from the key name
# alone; confirm each against the code that consumes this file.

# Presumably an upper bound on how far the arm may move in one step;
# units are not visible here -- TODO confirm.
max_arm_step: 2

# Four integers consumed as a schedule. The meaning of each position is
# defined by the consumer (possibly start step, end step, start value,
# end value) -- TODO confirm.
rollout_schedule:
  - 0
  - 100000
  - 1
  - 10

# Presumably the entropy target used for automatic temperature tuning
# in the policy update -- TODO confirm.
target_entropy: -3

# Presumably how often the actor is updated; whether this counts
# environment steps or critic updates is not visible here -- TODO confirm.
actor_freq: 20

# Presumably the total number of training steps -- TODO confirm.
n_steps: 200000
