# Hyperparameters and run settings read by the consuming training script.
# NOTE(review): the consumer is not visible from this file; the per-key notes
# below are inferred from key names and should be confirmed against it.

# Presumably optimizer learning rates for the actor, value and critic
# networks (inferred from the `_lr` suffix). Written with a decimal point and
# a signed exponent so YAML 1.1 loaders resolve them as floats, not strings.
actor_lr: 2.0e-4
value_lr: 2.0e-4
critic_lr: 2.0e-4

# Boolean switch; canonical lowercase `true` parses identically under
# YAML 1.1 and 1.2. Presumably enables layer normalization - TODO confirm.
layer_norm: true
# Presumably the dropout probability applied in the value network - TODO confirm.
value_dropout_rate: 0.5
# NOTE(review): the meaning of alpha is algorithm-specific and not
# determinable from this file; check the consuming code.
alpha: 0.1

# Output directory for logs; relative path, so presumably resolved against
# the process working directory - verify against the launcher.
log_dir: tf-logs/benchmark/antmaze

# Presumably the number of episodes per evaluation and the interval between
# evaluations; the unit of eval_freq (steps vs. updates) is not shown here.
eval_episodes: 100
eval_freq: 100000