# Dotted import path of the workspace class this config is written for.
# NOTE(review): the `_target_` key follows the Hydra instantiation convention;
# confirm that is how this file is loaded.
_target_: consistency_policy.rollout_d4rl.rollout_ddim_maze_workspace.DDIMRolloutMazeWorkspace
# Experiment label.
exp_name: default
# Settings for the EMA model; `_target_` names the class to build.
# See also `training.use_ema`, which is set to true in this file.
# NOTE(review): the exact meaning of inv_gamma / power / min_value / max_value /
# update_after_step is defined by EMAModel and is not visible here — confirm
# against that class before changing them.
ema:
  _target_: diffusion_policy.model.diffusion.ema_model.EMAModel
  inv_gamma: 1.0
  max_value: 0.9999
  min_value: 0.0
  power: 0.75
  update_after_step: 0

# Top-level horizon. The same value is repeated at `policy.horizon` and
# `task.dataset.horizon`, so all three must be edited together when switching
# maze size. Commented lines are the values for the other sizes
# (128 = umaze, 256 = medium, 384 = large, per the note at the end of this file).
# horizon: 128
# horizon: 256
horizon: 384

# NOTE(review): not referenced by any other key in this file; presumably read
# directly by the workspace or dataset code — TODO confirm it is still used.
keypoint_visible_rate: 1.0
# Experiment-logging settings (run name, project, tags, resume flag).
# NOTE(review): the field names look like Weights & Biases init arguments
# (this file also has `multi_run.wandb_name_base`) — confirm against the
# workspace code.
logging:
  group: null
  id: null
  mode: online
  name: dp_test
  project: diffusion_policy_debug
  resume: false
  # Free-form labels attached to the run.
  tags:
  - train_diffusion_unet_maze_large
  - maze2d_ddim
  - default
# Multi-run settings: an output directory and a base name for W&B runs.
# NOTE(review): `run_dir` points at a 2022.12.29 `hybrid_square_image` run,
# which does not match this maze2d DDIM config; it looks like a leftover from
# the config this file was derived from — confirm whether it is still read.
multi_run:
  run_dir: data/outputs/2022.12.29/22.31.27_train_diffusion_unet_hybrid_square_image
  wandb_name_base: dp_test

# Top-level n_action_steps. The same value is repeated at
# `policy.n_action_steps` and `task.env_runner.n_action_steps`, and it equals
# `horizon` in this file. Commented lines are the values for the other maze
# sizes (128 = umaze, 256 = medium, 384 = large, per the note at the end of
# this file).
# n_action_steps: 128
# n_action_steps: 256
n_action_steps: 384

# Top-level rollout/observation settings.
n_latency_steps: 0
# Repeated at `policy.n_obs_steps` and `task.env_runner.n_obs_steps`.
n_obs_steps: 2
# Name of this configuration.
name: rollout_maze_ddim
# Repeated at `policy.obs_as_global_cond`.
obs_as_global_cond: true
# NOTE(review): `task.env_runner.past_action` is also false; presumably the two
# are meant to agree — confirm.
past_action_visible: false
# Policy definition. `_target_` names the policy class; the remaining keys are
# presumably passed to it as constructor arguments — confirm against the
# instantiation code.
policy:
  _target_: diffusion_policy.policy.diffusion_unet_lowdim_policy_maze2d.DiffusionUnetLowdimMazePolicy
  # inference_mode: none # this will be populated automatically from training.inference_mode, do not set it here
  cond_predict_scale: true

  # Alternative network sizes, kept commented out for reference.
  # diffusion_step_embed_dim: 256
  # down_dims:
  # - 256
  # - 512
  # - 1024

  # diffusion_step_embed_dim: 256
  # down_dims:
  # - 512
  # - 1024
  # - 2048

  # Active network size (four levels).
  diffusion_step_embed_dim: 256
  down_dims:
  - 256
  - 512
  - 1024
  - 2048

  # Duplicates the top-level `horizon`; edit both together.
  # horizon: 128
  # horizon: 256
  horizon: 384

  # Duplicates the top-level `n_action_steps`; edit both together.
  # n_action_steps: 128
  # n_action_steps: 256
  n_action_steps: 384

  kernel_size: 5
  n_groups: 8
  # Duplicates the top-level `n_obs_steps`.
  n_obs_steps: 2
  # NOTE(review): the meaning of -1 is defined by the policy class and is not
  # visible in this file — confirm before changing.
  delta: -1
  noise_scheduler:
    # Alternative scheduler (consistency_policy Karras_Scheduler), kept
    # commented out for reference.
    # _target_: consistency_policy.diffusion.Karras_Scheduler
    # time_min: 0.02
    # time_max: 80.0
    # rho: 7.0
    # bins: 80
    # solver: heun
    # time_sampler: log_normal
    # scaling: boundary
    # use_c_in: true
    # data_std: .5
    # clamp: true
    # name: heun80
    # Active scheduler: diffusers DDIMScheduler.
    _target_: diffusers.schedulers.scheduling_ddim.DDIMScheduler
    num_train_timesteps: 100
    beta_start: 0.0001
    beta_end: 0.02
    beta_schedule: squaredcos_cap_v2
    clip_sample: true
    set_alpha_to_one: true
    steps_offset: 0
    prediction_type: epsilon # or sample
  # NOTE(review): a single inference step against `num_train_timesteps: 100`;
  # confirm this is the intended rollout setting.
  num_inference_steps: 1
  # Duplicates the top-level `obs_as_global_cond`.
  obs_as_global_cond: true
  # Same contents as the top-level `shape_meta` and `task.shape_meta`.
  shape_meta:
    action:
      shape:
      - 2
    observation:
      shape:
      - 4
# Action and observation shapes. Same contents as `policy.shape_meta` and
# `task.shape_meta`; keep the three copies identical.
shape_meta:
  action:
    shape:
    - 2
  observation:
    shape:
    - 4
# Task definition: the dataset, the environment runner used for rollouts, and
# the task's shape metadata.
task:
  abs_action: true
  dataset:
    _target_: diffusion_policy.dataset.d4rl_dataset.D4RLDataset
    # Same environment name as `task.env_runner.env_name`.
    env_name: 'maze2d-large-v1'

    # Duplicates the top-level `horizon`; edit both together.
    # horizon: 128
    # horizon: 256
    horizon: 384

    pad_after: 0
    pad_before: 0
    seed: 42
    val_ratio: 0.02
  env_runner:
    _target_: diffusion_policy.env_runner.maze2d_lowdim_state_runner.Maze2dLowdimStateRunner
    # Same environment name as `task.dataset.env_name`.
    env_name: 'maze2d-large-v1'
    # NOTE(review): crf / fps look like video-recording settings — confirm
    # against the runner.
    crf: 22
    fps: 10
    max_steps: 1000

    # Duplicates the top-level `n_action_steps`; edit both together.
    # n_action_steps: 128
    # n_action_steps: 256
    n_action_steps: 384

    n_envs: 1
    # Duplicates the top-level `n_obs_steps`.
    n_obs_steps: 2
    n_test: 100
    n_test_vis: 16
    n_train: 2
    n_train_vis: 2
    past_action: false
    test_start_seed: 100000
    tqdm_interval_sec: 1.0
  name: d4rl_maze_ddim
  # Same contents as the top-level `shape_meta` and `policy.shape_meta`.
  shape_meta:
    action:
      shape:
      - 2
    observation:
      shape:
      - 4
  # Same value as the top-level `task_name`.
  task_name: d4rl_maze_ddim
# Same value as `task.name` and `task.task_name`.
task_name: d4rl_maze_ddim
# Run-time settings for the workspace: mode flags, device, checkpoint to load,
# seed and output directory.
training:
  inference_mode: false # Setting this to true disables the teacher, warm start, and training loop
  online_rollouts: true # Setting this to false disables the env_runner
  device: cuda:0

  # Checkpoint to load. Commented lines are the `sm` and `med` checkpoints;
  # the active line is the `lg` checkpoint and matches `output_dir` below.
  # load_path: ./Diffusion/outputs/ddim/d4rl_maze_sm/checkpoints/latest.ckpt
  # load_path: ./Diffusion/outputs/ddim/d4rl_maze_med/checkpoints/epoch=0010-train_mse_error=1.210.ckpt
  load_path: ./Diffusion/outputs/ddim/d4rl_maze_lg/checkpoints/epoch=0005-train_mse_error=2.627.ckpt

  seed: 42
  use_ema: true
  # Output directory; switch together with `load_path` when changing maze size.
  # output_dir: ./Diffusion/outputs/ddim/d4rl_maze_sm
  # output_dir: ./Diffusion/outputs/ddim/d4rl_maze_med
  output_dir: ./Diffusion/outputs/ddim/d4rl_maze_lg


## large: 384  medium: 256  umaze: 128