# Hydra defaults list: the config files/groups composed into this config.
# `_self_` is listed last, so the keys defined in this file are merged after
# the entries above and take precedence over them.
defaults:
  - default
  - dataset: sequence
  - backbone: unet
  - algorithm: diffusion
  - env: walker2d
  - _self_

# Override applied on top of the `backbone: unet` selection from the defaults
# list.
backbone:
  dim: 64

# Overrides applied on top of the `env: walker2d` selection from the defaults
# list. Every value is an interpolation of the same-named top-level key defined
# at the bottom of this file, so the numbers are set in one place only.
env:
  use_cpx: ${use_cpx}
  vel_scale: ${vel_scale}
  height_limit: ${height_limit}
  height_min: ${height_min}
  v_max: ${v_max}
  v_min: ${v_min}

# Overrides applied on top of the `algorithm: diffusion` selection from the
# defaults list. The limit/scale values are interpolations of the same-named
# top-level keys in this file, i.e. the same values that `env` receives.
algorithm:
  # NOTE(review): the top-level `env_name` in this file is spelled
  # `walker2dcpx2` (no underscore) — confirm both spellings are intended.
  env_name: "walker2d_cpx2"
  safe_method: "RoS"
  height_limit: ${height_limit}
  vel_scale: ${vel_scale}
  height_min: ${height_min}
  v_max: ${v_max}
  v_min: ${v_min}
  # Presumably the index of the velocity entry inside the observation vector —
  # TODO confirm against the algorithm code.
  obs_vel_idx: 9
  
# Policy config with no guide added.
# `_target_` names the class to instantiate; `preprocess_fns` is left as an
# empty list.
policy:
  _target_: src.sampling.policies.GuidedPolicy
  preprocess_fns: []

# Validation DataLoader. Its batch size is tied to `eval.samples`, so one
# batch holds exactly that many items.
val_dataloader:
  _target_: torch.utils.data.DataLoader
  batch_size: ${eval.samples}
  shuffle: true

# Evaluation settings.
eval:
  # Checkpoint to load; the path is hard-coded to one specific training run.
  load_model_path: "outputs/walker2d/diffusion_train_horizon160/42_2026-01-07_14-21-46/state_final.pt"
  # Number of horizons to sample when computing the distribution difference.
  # Also used as `val_dataloader.batch_size`.
  samples: 200
  # rollout
  n_episodes: 10  # number of trajectories to roll out
  seed: ${seed}  # reuses the top-level `seed`
  is_video: true
  video_episodes: 2
  # NOTE(review): rollout is skipped here while `n_episodes` / video options
  # are still set — presumably they are ignored when this is true; confirm.
  skip_rollout: true

  check_index_list: [0, 1, 2, 3, 4, 5, 6, 7]  # dimensions considered when computing smoothness


# Top-level identifiers for this experiment; presumably used to name runs and
# output locations — confirm against the consumer.
# NOTE(review): `algorithm.env_name` in this file is spelled "walker2d_cpx2"
# (with an underscore) — confirm both spellings are intended.
env_name: walker2dcpx2
algo_name: RoS
run_name: time_horizon160


# Shared top-level parameters. Several of them are referenced elsewhere in this
# file through `${...}` interpolation (`seed`, and the limit/scale values
# below).
device: "cuda:0"
seed: 42
dataset_minari_name: "mujoco/walker2d/medium-v0"
horizon: 160  # when using the unet backbone, horizon must be divisible by 8
max_seq: 1000
obs_dim: 17
act_dim: 6
# Equals obs_dim + act_dim (17 + 6); presumably must be kept in sync with
# them — confirm.
transition_dim: 23
cond_dim: 17  # same value as obs_dim
steps: 20  # number of diffusion steps

# Values forwarded to both `env` and `algorithm` via interpolation.
height_limit: 1.35
vel_scale: 0.01
height_min: 0.9
v_max: 1.4
v_min: -1.4
use_cpx: 2  # forwarded to `env` only


