nodes: 2
tasks_per_node: 8
cpus_per_task: 16
mem_per_gpu: 210G
copy_code: false
folder: ${JEPAWM_LOGS}/droid_final_sweep/droid_4fpcs_fps4_r256_dv3vitl_asp1_pred_AdaLN_depth12_noprop_repro_2roll_4n
tag: online_gc_zeroshot/place_L2_cem_sourcedset_H3_nas1_maxnorm005_scaleact_repeat5_fskip5_max60_ctxt2_r256_alpha0_ep32_decode/epoch-315-plan-only
eval_name: simu_env_planning
meta:
  quick_debug: false
  seed: 1
  eval_episodes: 32
distributed:
  distribute_multitask_eval: true
  local_rng_samplers: true
  seed_shift: horizon_1000
logging:
  exp_name: gc_zeroshot_dist
  save_csv: true
  tqdm_silent: false
  optional_plots: true
model_kwargs:
  module_name: app.vjepa_wm.modelcustom.simu_env_planning.vit_enc_preds
  checkpoint: jepa-latest.pth.tar
  pretrain_kwargs:
    grid_size: 16
    tubelet_size_enc: 1
    use_activation_checkpointing: false
    action_conditioning: token
    proprio_encoding: none
    num_frames_pred: 4
    visual_encoder:
      enc_type: dino
      enc_version: dinov3_vitl16
      pretrain_enc_path:
      pretrain_enc_ckpt_key:
      embed_dim: 1024
      enc_use_rope:
      enc_name:
      use_sdpa_enc:
      num_frames_enc:
      uniform_power: true
    action_encoder:
      action_tokens: 1
      action_emb_dim: 0
      act_mlp: false
      action_encoder_inpred: true
    proprio_encoder:
      proprio_tokens: 0
      proprio_emb_dim: 0
      prop_mlp: false
      proprio_encoder_inpred: false
    predictor:
      tubelet_size: 1
      pred_num_heads: 16
      pred_depth: 12
      pred_embed_dim: 1024
      pred_use_extrinsics: false
      pred_type: AdaLN
      act_pred_projector:
      use_SiLU:
      use_rope: true
    wm_encoding:
      batchify_video: true
      dup_image: false
      normalize_reps: false
    rollout_cfg:
      rollout_steps: 2
      train_rollout_prefixes: random
      rollout_stop_gradient: true
      ctxt_window_train_rollout: 3
      do_parallel_rollout:
      do_sequential_rollout: true
      prepend_gt:
      sampling_scheduler:
        type: linear
        start: 0.0
        end: 0.0
    attn:
      local_window_time: 3
      local_window_h: -1
      local_window_w: -1
    heads_cfg:
      architectures:
        image_head:
          kind: vit
          config:
            patch_size: 8
            in_chans: 3
            img_size: [256, 256]
            embed_dim: 1024
            decoder_embed_dim: 1024
            depth: 24
            num_heads: 16
            mlp_ratio: 4.0
            num_views: 1
            use_activation_checkpointing: false
            use_lpips: true
            pixelloss_weight: 10
            perceptual_weight: 1
      pretrain_dec_path:
        image_head: ${JEPAWM_OSSCKPT}/vm2m_lpips_dv3vitl_256_INet.pth.tar
  data:
    dataset_type: custom
    datasets:
    - Robocasa
    datasets_weights:
    seed: 234
    img_size: 256
    validation:
      val_datasets:
      - Robocasa
      num_frames_val: 5
      val_dataset_batch_size: 4
      val_dataset_drop_last: false
      val_dataset_fpcs:
      - 5
      val_dataset_camera_views:
      - robot0_leftview
      val_viz_rank0_loader: true
      val_datasets_1:
        names:
        - Franka_hf
        batch_size: 4
        drop_last: false
        fps: 4
        fpcs:
        - 5
        camera_views:
        - exterior_image_2_left
    loader:
      batch_size: 8
      num_workers: 16
      pin_mem: true
      persistent_workers: true
    custom:
      split_ratio: 0
      frameskip: 5
      action_skip: 5
      state_skip: 1
      normalize_action: false
      traj_subset: true
      filter_first_episodes:
      filter_tasks:
      - PnPCounterTop
      num_hist: 7
      num_pred: 1
      with_reward:
      custom_teleop_dset: true
    droid:
      camera_frame:
      camera_views:
      - left_mp4_path
      droid_to_rcasa_action_format: 1
      rcasa_to_droid_action_format:
      fps: 4
      dataset_fpcs:
      - 4
      mpk_manifest_patterns:
      - '**/pick/liftcup_v0/run_0001/episode.h5'
      - '**/pick/pickandplaceredcube_v0/run_0001/episode.h5'
      - '**/pick/pickcube_v0/run_0001/episode.h5'
      - '**/pick/pickpen_v0/run_0001/episode.h5'
      - '**/pick/pickupcup_v0/run_0001/episode.h5'
      - '**/pick/reachcup_v0/run_0001/episode.h5'
      - '**/pick/reachliftcup_v0/run_0001/episode.h5'
      - '**/pick/reachliftcup_v1/run_0001/episode.h5'
      - '**/push/brownboxpush_v0/run_0001/episode.h5'
      - '**/push/push_various_objects/blue_bowl/episode.h5'
      - '**/push/push_various_objects/blue_box/episode.h5'
      - '**/push/push_various_objects/cap/episode.h5'
      - '**/push/push_various_objects/pengiun_plush/episode.h5'
      - '**/folding/foldjacketsleeve_v0/run_0001/episode.h5'
      - '**/folding/foldjacketsleeve_v1/run_0001/episode.h5'
  data_aug:
    auto_augment: false
    random_horizontal_flip: false
    motion_shift: false
    random_resize_aspect_ratio:
    - 1.0
    - 1.0
    random_resize_scale:
    - 1.777
    - 1.777
    reprob: 0.0
    normalize:
    - - 0.485
      - 0.456
      - 0.406
    - - 0.229
      - 0.224
      - 0.225
  wrapper_kwargs:
    ctxt_window: 2
    proprio_mode: predict_proprio
task_specification:
  task: robocasa-PnPCounterTop
  obs: rgb
  obs_concat_channels: false
  goal_source: dset
  succ_def: simu
  done_at_succ: false
  max_episode_steps: 60
  goal_last: true
  goal_H: 75
  replay_expert: false
  num_frames: 1
  num_proprios: 1
  img_size: 256
  env:
    with_target: true
    with_velocity: true
    freeze_rand_vec: false
    manip_only: true
    custom_task: false
    camera_name: robot0_leftview
    rescale_act_droid_to_rcasa: true
    subtask: place
    sample_subtask_slice: true
    reach_threshold: 0.2
    place_threshold: 0.15
planner:
  planner_name: cem
  iterations: 15
  num_samples: 300
  num_elites: 10
  horizon: 3
  var_scale: 0.1
  max_norms:
  - 0.05
  - 0.01
  - 1.0
  max_norm_dims:
  - - 0
    - 1
    - 2
  - - 3
    - 4
    - 5
  - - 6
  momentum_mean: 0.
  momentum_std: 0.
  num_act_stepped: 1
  repeat_actskip: true
  decode_each_iteration: true
  distribute_planner: false
  planning_objective:
    objective_type: L2
    sum_all_diffs: false
    alpha: 0
