# Fully qualified class named by `_target_` (Hydra-style instantiation target).
_target_: diffusion_policy.workspace.train_diffusion_transformer_hybrid_workspace.TrainDiffusionTransformerHybridWorkspace

# Task identifier; interpolated into the dataset paths, the run name and the
# env runner further down in this file.
task_name: sim_transfer_cube_scripted

# `seed` is forwarded to task.dataset.seed and training.seed;
# `test_start_seed` is forwarded to task.env_runner.test_start_seed.
seed: 42
test_start_seed: 100000

# `horizon` is forwarded to the policy and the dataset; `n_action_steps` is
# forwarded to the policy and env runner and feeds the dataset's pad_after.
horizon: 10
n_action_steps: 8

# `n_demo` feeds the dataset's val_ratio expression and the logging name;
# `n_eval` sets both n_envs and n_test of the env runner.
n_demo: 4
n_eval: 50
# Checkpoint retention settings.
checkpoint:
  topk:
    # Metric name, comparison mode and count for the retained checkpoints.
    monitor_key: test_mean_score
    mode: max
    k: 5
    # Filename template; quoted because it contains `{`, `}` and `:`.
    format_str: 'epoch={epoch:04d}-test_mean_score={test_mean_score:.3f}.ckpt'
  save_last_ckpt: true
  save_last_snapshot: false
# Data-loader options with shuffling enabled (presumably the training loader;
# the separate `val_dataloader` section has shuffle disabled).
dataloader:
  shuffle: true
  batch_size: 32
  num_workers: 8
  pin_memory: true
  persistent_workers: false
# Follows n_obs_steps through interpolation (previously a separate literal 2,
# equal to n_obs_steps) so an override of n_obs_steps cannot leave this behind.
dataset_obs_steps: ${n_obs_steps}
# Exponential-moving-average model, described by `_target_` plus the keyword
# values below (presumably only used when training.use_ema is true — confirm).
ema:
  _target_: diffusion_policy.model.diffusion.ema_model.EMAModel
  update_after_step: 0
  inv_gamma: 1.0
  power: 0.75
  min_value: 0.0
  max_value: 0.9999
# Free-form experiment label (plain string).
exp_name: default
# NOTE(review): not referenced by any interpolation in this file — presumably
# read directly by the code; confirm it is still relevant for this task.
keypoint_visible_rate: 1.0
# Experiment-tracker settings: run identity, project, mode, resume flag, tags.
logging:
  group: null
  id: null
  mode: online
  # Run name assembled from the task and the main sequence-length settings.
  name: baseline_${task_name}_action_${n_action_steps}_horizon_${horizon}_${n_demo}_demo_train_diffusion_transformer_hybrid_aloha_image
  project: diffusion_policy_debug
  resume: true
  tags:
  # The first and last tags interpolate the top-level `name` and `exp_name`
  # instead of repeating their literal values, so overriding either key keeps
  # the tags in sync. With the values in this file they resolve to the same
  # strings as before.
  - ${name}
  - aloha
  - ${task_name}
  - ${exp_name}
# NOTE(review): both values carry a fixed 2023.01.04 timestamp and a
# `can_image` suffix, while task_name in this file is
# sim_transfer_cube_scripted — this looks like a leftover from another run;
# confirm before relying on it.
multi_run:
  wandb_name_base: '2023.01.04-04.00.54_train_diffusion_transformer_hybrid_can_image'
  run_dir: 'data/outputs/2023.01.04/04.00.54_train_diffusion_transformer_hybrid_can_image'
# Name of this configuration (plain string).
name: train_diffusion_transformer_hybrid

# Number of observation steps; forwarded to the policy, the dataset and the
# env runner through `${n_obs_steps}`.
n_obs_steps: 2
# NOTE(review): no `${n_latency_steps}` interpolation exists in this file —
# presumably read directly by the code; confirm.
n_latency_steps: 0
obs_as_cond: true
# Optimizer hyper-parameters.
optimizer:
  learning_rate: 0.0001
  betas: [0.9, 0.95]
  # Separate weight-decay values for the transformer and the observation encoder.
  transformer_weight_decay: 0.001
  obs_encoder_weight_decay: 1.0e-06
# NOTE(review): not referenced by any interpolation in this file — presumably
# read directly by the code; confirm it is still consumed.
past_action_visible: false
# Policy definition: `_target_` names the class, the remaining keys are the
# values handed to it. Values shared with other sections are interpolated from
# the top-level keys so there is a single place to change them.
policy:
  _target_: diffusion_policy.policy.diffusion_transformer_hybrid_image_policy.DiffusionTransformerHybridImagePolicy
  causal_attn: true
  # Cropping is left unset (null).
  # NOTE(review): the previous comment here only said "crop?" — confirm whether
  # a crop shape is intended for the 480x640 image input.
  crop_shape: null
  eval_fixed_crop: true
  horizon: ${horizon}
  n_action_steps: ${n_action_steps}
  n_cond_layers: 0
  n_emb: 256
  n_head: 4
  n_layer: 8
  n_obs_steps: ${n_obs_steps}
  noise_scheduler:
    _target_: diffusers.schedulers.scheduling_ddpm.DDPMScheduler
    beta_end: 0.02
    beta_schedule: squaredcos_cap_v2
    beta_start: 0.0001
    clip_sample: true
    num_train_timesteps: 100
    prediction_type: epsilon
    variance_type: fixed_small
  # Same value as noise_scheduler.num_train_timesteps above.
  num_inference_steps: 100
  # Follows the top-level `obs_as_cond` (previously a separate literal `true`),
  # consistent with horizon / n_action_steps / n_obs_steps above.
  obs_as_cond: ${obs_as_cond}
  obs_encoder_group_norm: true
  p_drop_attn: 0.3
  p_drop_emb: 0.0
  # Reuses the top-level `shape_meta` mapping instead of an inline copy; the
  # inline copy was identical (action [14], images [3, 480, 640] rgb, qpos [14]).
  shape_meta: ${shape_meta}
  time_as_cond: true
# Shapes of the action vector and of each observation entry.
shape_meta:
  action:
    shape: [14]
  obs:
    images:
      # presumably (channels, height, width) — TODO confirm
      shape: [3, 480, 640]
      type: rgb
    qpos:
      shape: [14]
# Task definition: dataset, evaluation runner and the tensor shapes they share.
task:
  abs_action: true
  dataset:
    _target_: diffusion_policy.dataset.aloha_image_dataset.AlohaImageDataset
    dataset_dir: data/act/${task_name}
    horizon: ${horizon}
    n_obs_steps: ${n_obs_steps}
    pad_after: ${eval:'${n_action_steps} - 1'}
    # Equals n_obs_steps - 1 with the values in this file.
    pad_before: 1
    seed: ${seed}
    # Reuses task.shape_meta (defined at the end of this mapping) instead of
    # carrying a second identical copy.
    shape_meta: ${task.shape_meta}
    # The denominator follows `num_episodes` below (previously a second
    # hard-coded 50.0). `float(...)` keeps the division floating-point, as the
    # `50.0` literal did; with the values in this file the expression is still
    # 1 - 4 / 50.0 = 0.92.
    val_ratio: ${eval:'1 - ${n_demo} / float(${task.dataset.num_episodes})'}
    camera_names: ['top']
    num_episodes: 50
    use_keyframe: false
    constant_keyframe: null
    use_cache: false
  dataset_path: data/act/${task_name}
  dataset_type: ph
  env_runner:
    _target_: diffusion_policy.env_runner.aloha_image_runner.AlohaImageRunner
    crf: 22
    fps: 10
    max_steps: 400
    n_action_steps: ${n_action_steps}
    # Both the environment count and the test count come from `n_eval`.
    n_envs: ${n_eval}
    n_obs_steps: ${n_obs_steps}
    n_test: ${n_eval}
    n_test_vis: 4
    n_train: 0
    n_train_vis: 0
    multiplier: 1
    past_action: false
    test_start_seed: ${test_start_seed}
    tqdm_interval_sec: 1.0
    task_name: ${task_name}
  name: ${task_name}
  shape_meta:
    action:
      shape:
      - 14
    obs:
      images:
        shape:
        - 3
        - 480
        - 640
        type: rgb
      qpos:
        shape:
        - 14
  task_name: ${task_name}
# Training-loop settings, grouped by concern.
training:
  # Run control.
  device: 'cuda:0'
  seed: ${seed}
  debug: false
  resume: true
  use_ema: true

  # Length of training and learning-rate schedule.
  num_epochs: 3500
  gradient_accumulate_every: 1
  lr_scheduler: cosine
  lr_warmup_steps: 1000
  max_train_steps: null
  max_val_steps: null

  # Periodic actions (intervals are presumably counted in epochs — TODO confirm).
  checkpoint_every: 100
  rollout_every: 100
  sample_every: 5
  val_every: 5

  tqdm_interval_sec: 1.0
# Data-loader options for validation; same values as `dataloader` except that
# shuffling is disabled.
val_dataloader:
  shuffle: false
  batch_size: 32
  num_workers: 8
  pin_memory: true
  persistent_workers: false
