# Flat mapping of run options. The code that reads this file is not visible
# here, so the per-key notes below are inferred from the key names only --
# confirm each one against the consumer before relying on it.
#
# Booleans are written in canonical lowercase (`true`/`false`). YAML 1.1
# loaders and the YAML 1.2 core schema resolve these to the same boolean
# values as the capitalised `True`/`False` spellings.

# Presumably toggles learning a reward model -- TODO confirm.
learn_reward: false
# Presumably the number of iterations of the main loop -- TODO confirm.
num_iters: 1000
# Presumably enables acquisition-function-based selection -- TODO confirm.
use_acquisition: true
# NOTE(review): meaning of "all" is not determinable from this file.
rollout_all: false
# Presumably controls whether data gathered from rollouts is used -- verify.
use_rollout_data: false
# Presumably enables sampling via rollouts -- TODO confirm.
rollout_sampling: true
# Presumably a count of random candidates for acquisition optimisation --
# TODO confirm name expansion ("n random acq-opt") and units.
n_rand_acqopt: 100
# Presumably toggles an MPC (model predictive control?) code path -- verify.
use_mpc: false
