# Flat key/value settings. The code that consumes this file is not visible
# here, so the per-key notes below are inferred from the key names only.
# TODO(review): confirm each note against the consumer.
#
# Booleans are written in canonical lowercase (true/false) so they do not
# depend on a loader accepting the capitalised True/False spellings.

# Presumably toggles learning the reward rather than using a known one.
learn_reward: false
# Presumably the total number of iterations to run.
num_iters: 4000
# Presumably enables an acquisition function for choosing queries.
use_acquisition: true
# Presumably selects sampling via rollouts; disabled here.
rollout_sampling: false
# Name suggests the number of random candidates used when optimizing the
# acquisition function; verify.
n_rand_acqopt: 1000
# Presumably enables an MPC-based controller; disabled here.
use_mpc: false
