---
# Job metadata: the script to run plus worker/resource settings
# (presumably consumed by the experiment launcher — confirm against its reader).
meta_data:
  script_path: 'run_scripts/evaluate_policy.py'
  exp_name: 'test_policy_eval'
  description: 'Evaluate a policy'

  # Worker count and per-worker resource figures.
  num_workers: 4
  num_gpu_per_worker: 1
  num_cpu_per_worker: 8
  mem_per_worker: '16gb'

  # Comma-separated names, each stored as one plain string (not a YAML list).
  partitions: 'p100,max12hours'
  node_exclusions: 'gpu048,gpu024,gpu025,gpu012,gpu027'
# -----------------------------------------------------------------------------
variables:
  # Every leaf under `variables` is a list of candidate values
  # (presumably the launcher runs one job per combination — confirm).
  seed: [11992]
  method: ['gail-lfo']
  env_specs:
    # Block sequence: one environment per line, so an entry can be enabled or
    # disabled by (un)commenting that single line. This also avoids placing a
    # comment directly after `[`, which requires separating whitespace per the
    # YAML spec and is not accepted by every parser.
    env_name:
      # - 'invpendulum'
      # - 'invdoublependulum'
      # - 'hopper'
      # - 'walker'
      - 'halfcheetah'
      - 'ant'
# -----------------------------------------------------------------------------
constants:
  # Scalar settings given as single values rather than lists.
  ablation_study: true
  # expert_name: 'hopper_sac'
  # expert_idx: 0

  # Demo-statistics based preprocessing switches; all disabled here.
  scale_env_with_demo_stats: false
  minmax_env_with_demo_stats: false
  state_diff: false

  # NOTE(review): this path names a gail-lfo *walker* run, while the env_name
  # values listed under `variables` are 'halfcheetah' and 'ant' — confirm the
  # checkpoint matches the environment(s) being evaluated.
  policy_checkpoint: './logs/gail-lfo-walker-union--gp-8.0--spalpha-1.0--idbeta-0.5--rs-2.0/gail_lfo_walker_union--gp-8.0--spalpha-1.0--idbeta-0.5--rs-2.0--2020_12_27_23_19_11--s-0/best.pkl'
  eval_deterministic: true

  # Policy network shape (presumably must match the checkpoint — confirm).
  policy_net_size: 256
  policy_num_hidden_layers: 2

  # Evaluation rollout settings.
  num_eval_steps: 2000
  max_path_length: 1000
  no_terminal: false

  # Rendering is switched off; the remaining render_* keys are still supplied.
  render: false
  render_kwargs: {}
  render_mode: 'rgb_array'

  video_path: './videos/'

  env_specs:
    # env_name: 'walker'
    env_kwargs: {}
    eval_env_seed: 0
