# Rollout configuration for a D4RL task: the top-level `_target_` names the
# workspace class (EDMRolloutD4RLWorkspace) by its dotted import path.
# Presumably resolved by Hydra-style instantiation — confirm against the launcher.
_target_: consistency_policy.rollout_d4rl.rollout_teacher_d4rl_workspace.EDMRolloutD4RLWorkspace
# Experiment label.
exp_name: default
# Exponential-moving-average helper, constructed from EMAModel.
# NOTE(review): in upstream diffusion_policy the decay is warmed up as
# 1 - (1 + step / inv_gamma) ** -power and clamped to [min_value, max_value];
# confirm the EMAModel used by this repo behaves the same way.
ema:
  _target_: diffusion_policy.model.diffusion.ema_model.EMAModel
  inv_gamma: 1.0
  max_value: 0.9999
  min_value: 0.0
  power: 0.75
  # 0 presumably means EMA updates start from the very first step — confirm.
  update_after_step: 0
# Top-level horizon; policy.horizon carries the same value (16).
horizon: 16
# NOTE(review): no other key in this file refers to keypoints; this looks like
# a leftover from a keypoint-based task config — confirm the workspace reads it.
keypoint_visible_rate: 1.0
# Experiment-tracker settings.
# NOTE(review): presumably Weights & Biases (multi_run defines wandb_name_base)
# — confirm against the workspace code.
logging:
  group: null
  id: null
  mode: online
  # NOTE(review): this timestamped name mentions
  # "train_diffusion_unet_hybrid_square_image", which does not match this D4RL
  # rollout config; it looks copied from another run — confirm before logging.
  name: 2022.12.29-22.31.30_train_diffusion_unet_hybrid_square_image
  project: diffusion_policy_debug
  resume: false
  tags:
  - rollout_diffusion_unet
  - d4rl
  - default
# Run directory and tracker name base for multi-run launches.
# NOTE(review): both values carry the same hard-coded 2022.12.29 timestamp and
# "square_image" name as logging.name; they look stale for this D4RL rollout —
# confirm whether they are still read.
multi_run:
  run_dir: data/outputs/2022.12.29/22.31.30_train_diffusion_unet_hybrid_square_image
  wandb_name_base: 2022.12.29-22.31.30_train_diffusion_unet_hybrid_square_image
# Step counts; the same values (1 / 1) are repeated under policy and
# task.env_runner, so keep all copies in sync when changing them.
n_action_steps: 1
n_latency_steps: 0
n_obs_steps: 1
# NOTE(review): the name says "student", but `_target_` and policy._target_
# point at teacher/EDM classes — confirm whether this should be a teacher name.
name: rollout_student_d4rl
# Same value as policy.obs_as_global_cond.
obs_as_global_cond: true
past_action_visible: false
# Policy settings, instantiated from KarrasUnetHybridD4RLPolicy.
policy:
  _target_: consistency_policy.teacher_d4rl.edm_policy_d4rl.KarrasUnetHybridD4RLPolicy
  # Placeholder only: this is populated automatically from
  # training.inference_mode, do not set it here. Plain `none` parses as the
  # string "none", not as YAML null.
  inference_mode: none
  cond_predict_scale: true
  diffusion_step_embed_dim: 128
  # Presumably the channel widths of the U-Net levels — confirm against the policy.
  down_dims:
  - 512
  - 1024
  - 2048
  # horizon / n_action_steps / n_obs_steps repeat the top-level values.
  horizon: 16
  kernel_size: 5
  n_action_steps: 1
  n_groups: 8
  n_obs_steps: 1
  # NOTE(review): -1 looks like a sentinel value; its meaning is defined by the
  # policy class — confirm. The commented line below is the alternative setting.
  delta: -1
  # delta: 0
  # Noise scheduler built from Karras_Scheduler.
  noise_scheduler:
    _target_: consistency_policy.diffusion.Karras_Scheduler
    # Presumably the minimum / maximum noise level and the rho exponent of the
    # Karras et al. (EDM) schedule — confirm against Karras_Scheduler.
    time_min: 0.02
    time_max: 80.0
    rho: 7.0
    bins: 80
    solver: heun
    time_sampler: log_normal
    scaling: boundary
    use_c_in: true
    data_std: 0.5
    clamp: true
    # Label combining the solver (heun) and bin count (80) chosen above.
    name: heun80
  obs_as_global_cond: true
  # Same shapes as the top-level shape_meta and task.shape_meta.
  shape_meta:
    action:
      shape:
      - 3
    observation:
      shape:
      - 11
# Action / observation shapes. The same values are repeated under
# policy.shape_meta and task.shape_meta; keep all three copies in sync.
shape_meta:
  action:
    shape:
    - 3
  observation:
    shape:
    - 11
# Task definition: environment runner plus the shapes it produces/consumes.
task:
  abs_action: true
  # Rollout runner, instantiated from D4RLLowdimRunner.
  env_runner:
    _target_: diffusion_policy.env_runner.d4rl_lowdim_runner.D4RLLowdimRunner
    env_name: 'hopper-medium-expert-v2'
    # Presumably video-encoding quality (crf) and frame rate for recorded
    # rollouts — confirm against the runner.
    crf: 22
    fps: 10
    max_steps: 1000
    # n_action_steps / n_obs_steps repeat the top-level and policy values.
    n_action_steps: 1
    n_envs: 1
    n_obs_steps: 1
    n_test: 1
    n_test_vis: 1
    # NOTE(review): n_train is 0 while n_train_vis is 2; with no train rollouts
    # the visualisation count presumably has no effect — confirm.
    n_train: 0
    n_train_vis: 2
    past_action: false
    test_start_seed: 100000
    tqdm_interval_sec: 1.0
  name: d4rl_hopper_medium_expert
  # Same shapes as the top-level shape_meta and policy.shape_meta.
  shape_meta:
    action:
      shape:
      - 3
    observation:
      shape:
      - 11
  task_name: d4rl_hopper_medium_expert
# Top-level task identifier; same value as task.name and task.task_name.
task_name: d4rl_hopper_medium_expert
# Rollout-time settings (device, checkpoint to load, seed, output location).
training:
  # Source of truth for policy.inference_mode, which is filled in from this key.
  inference_mode: true
  online_rollouts: true
  device: cuda:0
  # NOTE(review): the active checkpoint comes from d4rl_hopper_medium_replay,
  # while the task, output_dir and the commented alternatives below are all
  # d4rl_hopper_medium_expert — confirm this cross-dataset load is intentional.
  load_path: ./Diffusion/outputs/edm/d4rl_hopper_medium_replay/checkpoints/epoch=0600-train_loss=0.030.ckpt
  # load_path: ./Diffusion/outputs/edm/d4rl_hopper_medium_expert/checkpoints/epoch=0100-test_mean_scores=1.296.ckpt
  # load_path: ./Diffusion/outputs/edm/d4rl_hopper_medium_expert/checkpoints/epoch=0300-test_mean_scores=1.272.ckpt
  seed: 42
  # Presumably selects the EMA-tracked weights for rollouts — confirm.
  use_ema: true
  val_chaining_steps: 1
  output_dir: ./Diffusion/outputs/edm/d4rl_hopper_medium_expert