# @package _global_

diffuser:
  dir: /output/hydra_log/RL_Diffuser_Debug/multiruns/2023-09-15_04-01-29_903351/0 # most often used, seems on 4edge
  # dir: /output/hydra_log/RL_Diffuser_Debug/multiruns/2023-09-16_17-16-54_339154/0 # second choice
  # dir: /output/hydra_log/RL_Diffuser_Debug/multiruns/2023-09-21_04-13-28_616262/0 # after retrain with maze 100000
  # dir: /output/hydra_log/RL_Diffuser_Debug/multiruns/2023-09-26_02-36-50_328692/0
  epoch: last

policy:
  _target_: diffuser.sampling.GuidedPolicy
  _partial_: true
  # guide: in python
  # diffusion_model: in python
  # normalizer:  in python
  preprocess_fns: []
  # the following are **sample_kwargs
  sample_fn: 
    # _target_: diffuser.sampling.n_step_guided_p_sample
    _target_: diffuser.sampling.n_step_guided_p_sample_freedom_timetravel
    _partial_: true
  scale: 0.0
  n_guide_steps: 1 # ! does not used, only use one step + time travel
  t_stopgrad: 2 # positive: grad[t < t_stopgrad] = 0; bigger is noise
  # grad_interval: [0.4,0.7]
  # grad_interval: [0.05, 1.0]
  grad_interval: [0.0, 1.0]
  scale_grad_by_std: true
  travel_repeat: 2 # time travel
  travel_interval: [0.3,0.7] # if float, would use [horizon*travel_interval, horizon]

mode: default # default: would only run once. local: would sweep over scale_list and guide_list

sample_num: 100
save_dir: ./debug/plot_maze
scale: 100
guide: 
  _target_: diffuser.sampling.Maze2dAvoidGuide
  target: [0.0, .0] # (3, 3)
  radius: 1.0
  distance_type: l2
  # target: [0.0457, 0.0458] # (3, 3)
  # target: [-0.8800, 0.5086] # (1, 4)
  # target: [-0.4172, -0.8800] # (2, 1)
  # target: [0.9714, -0.4171] # (5, 2)
  # target: [0.5086, 0.9714] # (4, 5)
# scale_list: [10.0, 100, 400, 1000, -10.0, -100, -400, -1000]
scale_list: [ 0.0, 10, 100, 200, 300, 400, 1000, 2000, 4000, 10000]
# scale_list: [100000, -100000]
# scale_list: [1.0,0.1,0.01,0.001]
guide_list: 
  # - _target_: diffuser.sampling.Maze2dTargetGuide
  #   target: [0.0457, 0.0458] # (3, 3)
  #   distance_type: l2
  # - _target_: diffuser.sampling.Maze2dTargetGuide
  #   target: [-0.9714, 0.5086] # (1, 5)
  #   distance_type: l2
  # - _target_: diffuser.sampling.Maze2dTargetXGuide
  #   target: -0.0 # (1, 4)
  #   distance_type: l2
  # - _target_: diffuser.sampling.Maze2dTargetYGuide
  #   target: 1.0 # (1, 4)
  #   distance_type: l2
  # - _target_: diffuser.sampling.Maze2dTargetGuide
  #   target: [-0.4172, -0.8800] # (2, 1)
  #   distance_type: l2
  # - _target_: diffuser.sampling.Maze2dTargetGuide
  #   target: [0.9714, -0.4171] # (5, 2)
  #   distance_type: l2
  # - _target_: diffuser.sampling.Maze2dTargetGuide
  #   target: [0.5086, 0.9714] # (4, 5)
  #   distance_type: l2
  # - _target_: diffuser.sampling.Maze2dTargetGuide
  #   target: [4.57, 4.58] # (3, 3)
  # - _target_: diffuser.sampling.Maze2dAvoidGuide
  #   target: [-0.8800, 0.5086] # (1, 4)
  #   radius: 0.5
  # - _target_: diffuser.sampling.Maze2dTargetGuide
  #   target: [-0.8800, 0.5086] # (1, 4)
  # - _target_: diffuser.sampling.Maze2dTargetGuide
  #   target: [0.9714, -0.4171] # (5, 2)
  # - _target_: diffuser.sampling.Maze2dTargetGuide
  #   target: [0.5086, 0.9714] # (4, 5)
  # - _target_: diffuser.sampling.NoTrainGuideDirection
  #   target: [0.0, 0.0] # (3, 3)
  # - _target_: diffuser.sampling.NoTrainGuideXLower
  # - _target_: diffuser.sampling.NoTrainGuideXHigher
  # - _target_: diffuser.sampling.NoTrainGuideYLower
  # - _target_: diffuser.sampling.NoTrainGuideYHigher
  # - _target_: diffuser.sampling.NoTrainGuideEndXLower
  # - _target_: diffuser.sampling.NoTrainGuideEndXHigher
  # - _target_: diffuser.sampling.NoTrainGuideEndYLower
  # - _target_: diffuser.sampling.NoTrainGuideEndYHigher
  # - _target_: diffuser.sampling.NoTrainGuideShorter
  # - _target_: diffuser.sampling.NoTrainGuideLonger
  # - _target_: diffuser.sampling.DummyGuide
  - _target_: diffuser.sampling.MultiGuide
    guides:
      # - weight: 1.0
      #   guide:
      #     _target_: diffuser.sampling.NoTrainGuideXHigher
      - weight: 1.0
        guide:
          _target_: diffuser.sampling.NoTrainGuideEndYHigher
      - weight: 0.03
        guide:
          _target_: diffuser.sampling.NoTrainGuideShorter
      # - weight: 1.0
      #   guide:
      #     _target_: diffuser.sampling.NoTrainGuideXLower
      # - weight: 10.0
      #   guide:
      #     _target_: diffuser.sampling.Maze2dAvoidGuide
      #     target: [-0.5457, 0.0458] # (3, 3)
      #     radius: 0.15


runner:
  _target_: src.runner.PlotMazeRunner
  _partial_: true

wandb:
  mode: online

seed: 0

# common - for all tasks (task_name, tags, output_dir, device)
algorithm_name: "DefaultAlgName"
task_name: "PlotMaze"
tags: ["debug"]

# Notes
# yhigher scale=10效果不错，挺分散的