# Flat settings mapping: two float hyperparameters, a log directory, and two
# integer evaluation settings. The log_dir value suggests an AntMaze benchmark
# run.
# NOTE(review): the code that consumes this file is not visible here, so the
# per-key notes below are assumptions to confirm against that consumer.
#
# Float. Presumably the expectile level of an expectile-regression loss
# (as used in IQL-style offline RL) — TODO confirm.
expectile: 0.9
# Float. Presumably a temperature / scaling coefficient applied to advantages
# in the policy objective — TODO confirm.
temperature: 10.0
# Relative path (no leading slash); presumably resolved against the process's
# working directory. The "tf-logs" prefix hints at TensorBoard-style event
# logs — confirm against the consumer.
log_dir: tf-logs/benchmark/antmaze
# Integer. Presumably the number of episodes run per evaluation pass —
# TODO confirm.
eval_episodes: 100
# Integer. Presumably the interval between evaluation passes; the unit
# (likely training steps) is not visible here — TODO confirm.
eval_freq: 100000