# @package _global_

# Agent settings. The `_global_` package directive at the top of this file
# makes Hydra place `agent` at the root of the composed config.
agent:
  name: 'ppo'
  # NOTE(review): 10.0 is much larger than the ~0.2 ratio clip commonly used
  # with PPO -- confirm which quantity this value bounds.
  clip_range: 10.0
  clip_obs: 200.0
  tanh_policy: true
  gaussian_policy: true
  # Must be turned off when the input is pixels.
  ob_norm: false
  encoder_conv_dim: 32

  # policy / critic networks and training schedule
  # policy_activation is one of: "relu", "elu", "tanh"
  policy_activation: 'relu'
  policy_mlp_dim: [1024, 1024]
  critic_ensemble: 2
  critic_mlp_dim: [1024, 1024]
  # Learning rates are written with an explicit mantissa dot: YAML 1.1
  # resolvers (e.g. plain PyYAML) load a bare `3e-4` as the string "3e-4"
  # rather than a float. `3.0e-4` is a float under every loader.
  actor_lr: 3.0e-4
  critic_lr: 3.0e-4
  max_global_step: 1000000
  rollout_length: 2000
  # NOTE(review): same value as `encoder.image_size` further down --
  # presumably the two must be kept in sync; confirm against the consumer.
  encoder_image_size: 19
  is_chef: true
  # encoder: observation-encoder settings, nested under `agent.encoder`
  encoder:
    # type is one of: "cnn", "mlp"
    type: 'cnn'
    # TODO: environment-specific; adjust per environment.
    image_size: 19
    # kernel_size and stride each list four entries -- presumably one per
    # convolutional layer; confirm against the encoder implementation.
    kernel_size: [3, 3, 3, 3]
    stride: [2, 1, 1, 1]
    conv_output_dim: 50
    soft_update_weight: 0.95