# @package _global_

run_name: "${optional_:${prefix}}\
  ${arch_name}\
  _${task_name}\
  _To${num_latest_obs}\
  _Ta${action_prediction_horizon}\
  _b${bs}\
  ${__optional:${suffix}}\
  ${_optional:${postsuffix}}"

arch_name: wbvima_sim_1st_view_large

# ====== DP specific ======
num_latest_obs: 2
action_prediction_horizon: 8

wd: 0.1
no_pcd: False
flash_attention: False
task_space_action: False
reweight_traj: False
random_shuffle_chunks: True
demo_wise_train_val_split: True
limit_demo_num: 1000
no_pcd_color: False

# ------ module ------
module:
  _target_: brs_algo.learning.module.DiffusionModule
  reweight_traj: ${reweight_traj}
  policy:
    _target_: brs_algo.learning.policy.WBVIMAPolicy
    prop_dim: 21
    prop_keys: ["odom/base_velocity", "qpos/torso", "qpos/left_arm", "qpos/left_gripper", "qpos/right_arm", "qpos/right_gripper"]
    num_latest_obs: ${num_latest_obs}
    no_pcd: ${no_pcd}
    no_pcd_color: ${no_pcd_color}
    flash_attention: ${flash_attention}
    task_space_action: ${task_space_action}
    use_modality_type_tokens: false
    prop_mlp_hidden_depth: 2
    prop_mlp_hidden_dim: 256
    pointnet_n_coordinates: 3
    pointnet_n_color: 3
    pointnet_hidden_depth: 3
    pointnet_hidden_dim: 512
    action_keys: ${action_keys}
    action_key_dims: ${action_key_dims}
    # ====== Transformer ======
    xf_n_embd: 1024
    xf_n_layer: 6
    xf_n_head: 8
    xf_dropout_rate: 0.1
    xf_use_geglu: true
    # ====== Action Decoding ======
    learnable_action_readout_token: false
    action_dim: 21
    action_prediction_horizon: ${action_prediction_horizon}
    diffusion_step_embed_dim: 512
    unet_down_dims: [128,256,512]
    unet_kernel_size: 5
    unet_n_groups: 8
    unet_cond_predict_scale: true
    # ====== diffusion ======
    noise_scheduler:
      _target_: diffusers.schedulers.scheduling_ddim.DDIMScheduler
      num_train_timesteps: 100
      beta_start: 0.0001
      beta_end: 0.02
      # beta_schedule is important
      # this is the best we found
      beta_schedule: squaredcos_cap_v2
      clip_sample: True
      set_alpha_to_one: True
      steps_offset: 0
      prediction_type: epsilon # or sample
    noise_scheduler_step_kwargs: null
    num_denoise_steps_per_inference: 16
  action_prediction_horizon: ${action_prediction_horizon}
  loss_on_latest_obs_only: false

data_module:
  _target_: brs_algo.learning.data.ActionSeqChunkDataModule
  obs_window_size: ${num_latest_obs}
  action_prediction_horizon: ${action_prediction_horizon}
  sim_data: True
  no_pcd: ${no_pcd}
  task_space_action: ${task_space_action}
  demo_wise_train_val_split: ${demo_wise_train_val_split}
  random_shuffle_chunks: ${random_shuffle_chunks}
  limit_demo_num: ${limit_demo_num}
  no_pcd_color: ${no_pcd_color}
