# Flat key/value configuration. The code that loads this file is not visible
# here, so the meanings noted below are inferred from key names only —
# confirm against the consumer before relying on them.
#
# The three *_lr keys all carry the same value (2.0e-4); presumably learning
# rates for separate actor / value / critic components — TODO confirm.
# NOTE: keep the decimal point and the signed exponent in these values. Some
# YAML 1.1 loaders (e.g. PyYAML) resolve a bare `2e-4` as a string, not a float.
actor_lr: 2.0e-4
value_lr: 2.0e-4
critic_lr: 2.0e-4
# presumably the number of ensemble members — TODO confirm what is ensembled
num_ensemble: 5
# NOTE(review): the role of alpha is not evident from this file — confirm
alpha: 0.02
# Relative path (no leading slash); presumably the log output directory —
# verify which base directory the consumer resolves it against.
log_dir: tf-logs/benchmark/antmaze
# presumably the number of episodes run per evaluation — TODO confirm
eval_episodes: 100
# presumably the interval between evaluations; the unit (steps, iterations,
# episodes, ...) is not shown in this file — confirm with the consumer
eval_freq: 100000