# Hydra-style defaults list: each entry names another config that is composed
# together with the keys defined in this file.
# NOTE(review): `_self_` is listed last, so values set in this file should take
# precedence over the composed groups — confirm against the Hydra version in use.
defaults:
  - default
  - dataset: sequence
  - backbone: dit
  - algorithm: flow
  - env: walker2d
  - _self_

# Override applied on top of the `dataset: sequence` group chosen in `defaults`.
dataset:
  use_padding: false

# Override applied on top of the `env: walker2d` group chosen in `defaults`.
env:
  # NOTE(review): integer 0 rather than a boolean, unlike the other flags in
  # this file — confirm which type the consumer expects.
  use_cpx: 0

# Trainer settings. `_target_` names the class to build; the remaining keys are
# presumably passed to it as constructor arguments — confirm at the call site.
trainer:
  _target_: src.utils.training.Trainer
  device: ${device}  # resolved from the top-level `device` key
  ema_decay: 0.995
  train_batch_size: 64
  # Written with an explicit mantissa dot so that YAML 1.1 loaders (e.g. plain
  # PyYAML) also parse it as a float; a bare `1e-4` is read as a string there.
  train_lr: 1.0e-4
  gradient_accumulate_every: 1
  step_start_ema: 2000
  update_ema_every: 10
  log_freq: 500
  save_freq: 200000
  label_freq: ${trainer.save_freq}  # kept equal to `save_freq` via interpolation
  save_parallel: false
  
# Policy config without a guide: the guidance-related sampling kwargs below
# are left commented out.
policy:
  _target_: src.sampling.policies.GuidedPolicy
  # NOTE(review): the two keys below are disabled here; presumably they are
  # supplied by the code that instantiates the policy — confirm.
  # diffusion_model: null
  # normalizer: null
  preprocess_fns: []
  # Sampling kwargs (all disabled in this config):
  # sample_fn: src.sampling.functions.n_step_guided_p_sample
  # n_guide_steps: 2
  # t_stopgrad: 2
  # scale_grad_by_std: true

# Validation DataLoader; its batch size is tied to `eval.samples` through
# interpolation, so one batch holds exactly that many samples.
val_dataloader:
  _target_: torch.utils.data.DataLoader
  batch_size: ${eval.samples}
  # NOTE(review): shuffling is enabled for validation; presumably intentional
  # so each evaluation draws a random batch — confirm.
  shuffle: true

# Evaluation settings.
eval:
  samples: 200   # how many horizons to sample when computing the distribution difference
  # Rollout settings
  n_episodes: 10  # how many trajectories to roll out
  seed: ${seed}
  is_video: true
  video_episodes: 2

  check_index_list: [0, 1, 2, 3, 4, 5, 6, 7] # which dimensions to consider when computing smoothness


# Run identifiers. The values mirror the `env` and `algorithm` choices in
# `defaults`; how they are consumed (e.g. output paths) is not visible here.
env_name: walker2d
algo_name: flow
run_name: train


# Global scalars; `device` and `seed` are referenced elsewhere in this file
# through `${device}` and `${seed}`.
# NOTE(review): the device is pinned to GPU index 2 — adjust per machine.
device: "cuda:2"
seed: 42
dataset_minari_name: "mujoco/walker2d/medium-v0"
horizon: 100  # if the unet is used, make sure horizon is divisible by 8
max_seq: 1000
obs_dim: 17
act_dim: 6
# Equals obs_dim + act_dim (17 + 6); presumably must be kept in sync by hand.
transition_dim: 23
cond_dim: 17
steps: 200  # number of sampling steps

iteration: 1000000  # number of training steps

