# Flat mapping of run settings.
#
# NOTE(review): train_steps is a string expression, not a number. The
# `${action_repeat}` part looks like OmegaConf/Hydra-style interpolation of the
# `action_repeat` key below, and the `/` is presumably evaluated by the
# consuming code -- confirm against the loader before editing. Quoted so that
# the string type is explicit.
train_steps: '5000000/${action_repeat}'
action_repeat: 2
iterations: 8
latent_dim: 100
batch_size: 2048
# Written with an explicit decimal point: YAML 1.1 loaders such as PyYAML
# resolve a bare `3e-4` as the string "3e-4" rather than as a float.
lr: 3.0e-4
first_step_qr_only: true