# Task and environment selection.
env:
  # Environment identifier. Presumably a Gymnasium MuJoCo environment ID that
  # the training script resolves — confirm against the consumer.
  env_name: Ant-v4

# Data collector settings.
collector:
  # Presumably the number of environment frames gathered per collection
  # batch — confirm against the training script.
  frames_per_batch: 2048
  # Presumably the overall frame budget for the run — confirm.
  # NOTE(review): the `_` digit separators are a YAML 1.1 integer form; a
  # strict YAML 1.2 loader may read this value as a string. Verify the loader.
  total_frames: 1_000_000

# Logging and evaluation settings.
logger:
  # Name of the logging backend; valid values are defined by the consumer.
  backend: wandb
  project_name: Mujoco_LRRL
  # Explicitly unset: no group name is configured here.
  group_name: null
  exp_name: Mujoco_Schulman17
  # Same value as collector.total_frames in this file. Presumably this means
  # evaluation is triggered at most once per run — confirm against the script.
  test_interval: 1_000_000
  num_test_episodes: 5
  # Canonical lowercase boolean (loads to the same value as `False`).
  video: false

# Optimizer settings.
optim:
  # Learning rate: 2.5e-4 (numerically equal to 25e-5). Written with a decimal
  # point because YAML 1.1 float resolution (e.g. stock PyYAML) requires one;
  # without it the scalar can load as a string instead of a float.
  lr: 2.5e-4
  weight_decay: 0.0
  anneal_lr: false
  # Explicit null rather than a bare key. Presumably the training script picks
  # a default device when this is unset — confirm against the consumer.
  device: null

# Loss settings (key names suggest a PPO objective with GAE — confirm against
# the training script).
loss:
  # Presumably the discount factor — confirm.
  gamma: 0.99
  mini_batch_size: 64
  ppo_epochs: 10
  gae_lambda: 0.95
  clip_epsilon: 0.2
  # Canonical lowercase boolean (loads to the same value as `False`).
  anneal_clip_epsilon: false
  critic_coef: 0.25
  # Entropy coefficient of 0.0; presumably this disables any entropy term in
  # the loss — confirm.
  entropy_coef: 0.0
  loss_critic_type: l2

# Compilation settings.
compile:
  compile: false
  # Explicit null rather than a bare key: same loaded value, but the intent
  # ("no mode selected") is unambiguous and matches logger.group_name.
  compile_mode: null
  cudagraphs: false
