# @package _global_

defaults:
  # No env config is selected by default (null). Other keys in this file
  # interpolate ${env.task_name}, so an env presumably has to be supplied
  # as an override when launching — TODO confirm.
  - ../env: null
  # - ../method: adm

# NOTE(review): -1 is presumably a sentinel (e.g. "use all demos") — confirm
# against the code that reads this key.
demos: -1
# NOTE(review): pixels is true while use_pixels is false. Confirm which flag
# the consumer actually reads and whether both keys are still needed.
pixels: true
use_pixels: false
frame_stack: 1

# important config for adm
ignore_qvel: false

# Safe-IQL specific configs
safe_iql:
  # Dynamics model path (relative to work_dir or absolute path).
  # If null, will try the default location:
  #   exp_local/models_eefnp/bigym_${env.task_name}/snapshots/best_snapshot.pt
  dynamics_path: null

  # Action space for k (downsampling rate)
  k_low: 2
  k_high: 4

  # Safety threshold
  epsilon: 0.01

  # Training hyperparameters
  num_epochs: 100
  batch_size: 512
  gamma: 0.9
  expectile: 0.95
  # Written with an explicit mantissa dot so that YAML 1.1 loaders (e.g.
  # PyYAML) also parse it as a float instead of the string "1e-4".
  learning_rate: 1.0e-4
  hidden_dims: [256, 256]

  # Checkpoint settings
  save_checkpoint: true
  checkpoint_every_n_epochs: 10  # Save checkpoint every N epochs
  save_best_checkpoint: true  # Save best checkpoint based on validation metric

  # Evaluation settings
  eval_every_n_epochs: 10  # Evaluate policy every N epochs
  eval_episodes: 100  # Number of episodes for evaluation
  eval_after_training: false

# Action-sequence and normalization settings.
# NOTE(review): use_standardization and use_min_max_normalization look like
# alternative normalization schemes (only min-max is enabled here) — confirm
# whether the consumer treats them as mutually exclusive.
action_sequence: 25
temporal_ensemble: true
use_standardization: false
use_min_max_normalization: true
min_max_margin: 0
norm_obs: true

# Run-level settings.
seed: 1
action_repeat: 1
execution_length: 1

# NOTE(review): presumably toggles an evaluation-only run — confirm.
eval: false

# Experiment-tracking settings.
# NOTE(review): swanlab_use lives under the wandb key although it appears to
# control a different tracker — confirm how the consumer reads it.
wandb:
  use: true
  swanlab_use: true
  project: safe_iql_bigym
  # Run name ends with the task name interpolated from the env config.
  name: safe_iql_bigym1_${env.task_name}
  mode: online

# Hydra output directory for a single run, keyed by the env's task name.
# NOTE(review): the path does not include the seed, so runs of the same task
# with different seeds would share this directory — confirm that is intended.
hydra:
  run:
    dir: ./exp_local/safe_iql/bigym1_${env.task_name}

