---
# Run configuration: a flat key/value mapping of training settings.
# NOTE(review): every key is interpreted by a consumer that is not visible
# in this file; the stanza headings below are inferred from key names only
# and should be confirmed against that consumer.

# Task selection and output location.
env: antmaze-large-diverse-v2
work_dir: train_offline
antmaze_no_normalize: true

# Data buffer capacity (presumably counted in transitions -- TODO confirm).
buffer_size: 5000000

# Optimisation settings. Values are kept in plain decimal notation on
# purpose: exponent forms such as 1e-4 load as strings in some YAML 1.1
# parsers.
actor_lr: 0.0001
vae_lr: 0.000005
discount: 0.995

# Weight-initialisation scales for the actor and critic
# (presumably final-layer init ranges -- TODO confirm).
actor_init_w: 0.001
critic_init_w: 0.003

# Evaluation schedule (eval_freq is presumably in training steps --
# TODO confirm).
eval_episodes: 100
eval_freq: 50000

# Method-specific switch and coefficients; their semantics are not
# visible in this file. Key spelling (including the upper-case DQRA) must
# stay exactly as the consumer expects.
DQRA: true
lambd: 0.06
ood: 0.15
