---
# Flat run configuration: every entry is a top-level scalar.
# Keys are grouped by apparent purpose; mapping order carries no meaning.
# NOTE(review): purpose notes below are inferred from key names only —
# confirm each against the script that loads this file.

# Run identification (presumably used for experiment tracking — confirm).
project: CORL
group: iql-antmaze-medium-play-v2-multiseed-v0
name: IQL

# Environment / dataset identifier.
env: antmaze-medium-play-v2

# Runtime and checkpointing.
device: cuda
# Explicit null: no checkpoint path is configured.
checkpoints_path: null
# Explicit empty string (not null): no model path is configured.
load_model: ''

# Training schedule and data handling.
max_timesteps: 1000000
batch_size: 256
buffer_size: 2000000
normalize: true
normalize_reward: true

# Evaluation cadence and size (units assumed to be steps / episodes —
# TODO confirm).
eval_freq: 5000
n_episodes: 100

# Algorithm hyperparameters.
discount: 0.99
# `tau` and `iql_tau` are two distinct settings; do not conflate them.
# Presumably `tau` is a target-update rate and `iql_tau` an IQL-specific
# coefficient — verify against the consumer.
tau: 0.005
iql_tau: 0.9
beta: 10.0
iql_deterministic: false

# Per-component learning rates (assumed from the `_lr` suffix).
actor_lr: 0.0003
qf_lr: 0.0003
vf_lr: 0.0003
