# Run configuration. Every feature toggle below is disabled; only the
# iteration count carries a non-boolean value.
# Booleans use the canonical lowercase spelling so that every YAML loader
# (1.1, 1.2 core, and strict/JSON-schema loaders) resolves them as booleans.

# NOTE(review): presumably switches reward learning on/off - confirm against
# the code that reads this file.
learn_reward: false

# Integer iteration count (exact meaning of an "iteration" is defined by the
# consumer - TODO confirm).
num_iters: 4000

# NOTE(review): presumably enables an acquisition step/function - confirm.
use_acquisition: false

# NOTE(review): rollout-related toggles; semantics are not visible from this
# file - confirm against the consumer.
rollout_all: false
rollout_sampling: false

# NOTE(review): presumably enables model-predictive control (MPC) - confirm.
use_mpc: false
