# Pipeline identifier; also used as a path component in hydra.run.dir.
# NOTE(review): this name says `cdp`, while `group` and `model_path` further
# down say `dbc` — confirm the mismatch is intended.
pipeline_name: cdp_realworld_image

# Environment / dataset
# env_name is interpolated into exp_name and hydra.run.dir.
env_name: realworld_image_eef_pos
# presumably false means relative (delta) actions — TODO confirm
abs_action: false
# Relative path; with hydra.job.chdir set to false it is presumably resolved
# against the directory the job is launched from — verify against the loader.
dataset_path: data/frankastack_fix.hdf5
mode: train
max_episode_steps: 400

# Shapes and types of the action vector and of each observation key.
# Sequences are indented under their key, matching crop_shape in this file.
shape_meta:
  action:
    shape:
      - 7  # same value as the top-level action_dim
  obs:
    agentview:
      # presumably channels-first (C, H, W) — TODO confirm
      shape:
        - 3
        - 224
        - 224
      type: rgb
    ee_pos:
      shape:
        - 3
      type: low_dim
    gripper_state:
      shape:
        - 1
      type: low_dim

# Duplicates shape_meta.action.shape (both are 7); presumably the two must be
# kept in sync — verify against the consumer.
action_dim: 7
# presumably the number of observation frames fed to the policy and the number
# of predicted actions executed per inference — TODO confirm
obs_steps: 4
action_steps: 2

# Diffusion
# The value is interpolated into exp_name.
# NOTE(review): pipeline_name starts with `cdp`, but the value here is `edm`
# and the original note says `csde` is the setting for cdp — confirm.
diffusion: edm  # alternative: csde (for cdp)
solver: euler

# DiT-specific arguments
embedding_dim: 256  # image embedding dimension
# 320 / 10 heads = 32; presumably d_model must be divisible by n_heads.
d_model: 320  # transformer model dimension
n_heads: 10  # number of attention heads
depth: 2  # number of transformer blocks

# Observation encoder
rgb_model: resnet18
# presumably a torchvision pretrained-weights identifier — TODO confirm
rgb_weights: IMAGENET1K_V1
# null = no value set; presumably disables resizing — verify against the encoder
resize_shape: null
# 224 x 224 equals the last two entries of shape_meta.obs.agentview.shape.
crop_shape:
  - 224
  - 224
random_crop: false
use_group_norm: true
use_seq: true

# Training
device: cuda:0
# Also the last path component of hydra.run.dir.
seed: 0
gradient_steps: 1000000
batch_size: 64
horizon: 4
# Interpolated into exp_name.
nn: dit
# presumably the fraction of the dataset held out for validation — TODO confirm
val_ratio: 0.05
sample_steps: 50
temperature: 1.0
diffusion_x: false
extra_sample_steps: 8

# Optimizer
lr: 0.0001  # presumably the learning rate (1e-4)

# Logging
# With the values in this file exp_name resolves to
# realworld_image_eef_pos_edm_dit.
exp_name: ${env_name}_${diffusion}_${nn}
save_path: logs
# project / group / wandb_mode are presumably passed to Weights & Biases —
# TODO confirm.
project: tactile-rep
group: dbc_realworld_image
wandb_mode: online
# presumably measured in gradient steps — TODO confirm
log_freq: 5000
save_freq: 20000
# Root of hydra.run.dir; currently the same directory as save_path.
log_dir: logs

# Evaluation
# Checkpoint path; presumably only read when mode is not `train` — TODO confirm.
# The directory name appears to encode obs_steps=4, action_steps=2, horizon=4
# (o4_a2_h4), which matches the values set in this file.
model_path: ckpt/dbc_stack_o4_a2_h4/model_200000.pt

# Hydra runtime settings
hydra:
  job:
    # Keep the process working directory unchanged instead of switching into
    # the run directory.
    chdir: false
  run:
    # With the values in this file this resolves to
    # logs/cdp_realworld_image/realworld_image_eef_pos/hydra/0.
    dir: ${log_dir}/${pipeline_name}/${env_name}/hydra/${seed}
  # null disables creation of the `.hydra` config-snapshot subdirectory.
  output_subdir: null
