---
# Run configuration for the antmaze-large-diverse-v2 environment.
# NOTE(review): the stanza descriptions below are inferred from key names
# only; confirm each against the script that consumes this file.

# Run identity and output location.
env: antmaze-large-diverse-v2
seed: 1
work_dir: train_finetune

# Starting checkpoint.
# Presumably produced by an earlier offline training stage; verify.
pretrain_model: models/offline_trained_models/antmaze-large-diverse-v2

# Algorithm settings.
# NOTE(review): `lambd_cool` looks like a switch related to `lambd`;
# semantics are not visible here. TODO confirm.
discount: 0.995
lambd: 0.06
lambd_cool: true
antmaze_no_normalize: true

# Evaluation settings.
# NOTE(review): unit of `eval_freq` (steps vs. episodes) is not shown here.
eval_freq: 50000
eval_episodes: 100