# @package _global_
#
# The directive above must use Hydra's single-underscore keyword `_global_`
# so that the keys in this file are merged at the root of the composed
# config rather than under a nested package node.

# Config groups composed into this config. The leading `/` makes each group
# path absolute, i.e. resolved from the config search-path root.
defaults:
  - /alg: deepltl
  - /rl_alg: ppo

# Environment identifier consumed by the training code.
env: CartPole-v1

# Network definitions for the actor and the critic. Each entry names the
# class to build via Hydra's `_target_` key (single underscores -- this is
# the spelling `hydra.utils.instantiate` looks for); the remaining keys are
# passed to that class as keyword arguments.
model:
  actor:
    _target_: jaxltl.networks.mlp.MLP
    hidden_sizes: [64, 64]
    activation: tanh
    # Three scales for two hidden layers -- presumably one per layer including
    # the output layer (TODO confirm against MLP). 1.414 ~= sqrt(2); the actor
    # uses a small final scale (0.01).
    weight_init_scales: [1.414, 1.414, 0.01]
  critic:
    _target_: jaxltl.networks.mlp.MLP
    hidden_sizes: [64, 64]
    activation: tanh
    # Same layout as the actor, but the final scale is 1.0.
    weight_init_scales: [1.414, 1.414, 1.0]

# Overrides for the `rl_alg` group selected in the defaults list (`ppo`).
rl_alg:
  # Written as a plain integer: the exponent form `5e5` has no decimal point,
  # which YAML 1.1 loaders such as PyYAML resolve to a string, and loaders
  # that do accept it yield a float rather than an integer count.
  total_timesteps: 500000
  num_envs: 4
  num_steps: 128
  num_minibatches: 4
  update_epochs: 4
  gamma: 0.99
  gae_lambda: 0.95
  clip_eps: 0.2
  ent_coef: 0.01
  vf_coef: 0.5
  lr: 2.5e-4
  max_grad_norm: 0.5
  anneal_lr: true
