name: SDv1.5mv-rawbox-t
pretrained_model_name_or_path: /dzy/Code/stable-diffusion-v1-5/

bbox_mode: 'all-xyz'
bbox_view_shared: false
crossview_attn_type: basic
train_with_same_noise: false
train_with_same_t: true

# temporal
animatediff_file: /datadrive/ckpt/Animatediff/mm_sd_v15_v2.ckpt
load_pretrain_from: null
allow_partial_load: false
pretrained_magicdrive: /home/qid/duzhiying/nuscenes/ckpt/magicdrive-t-log/epoch1
# unet_plus_animatediff: /home/qid/duzhiying/nuscenes/ckpt/magicdrive-t-log/SDv1.5mv-rawbox-t_2024-08-07_13-11_2.0t_0.4.4/weight-E1-S19348
train_with_same_noise_t: false
video_length: 16
sc_attn_index:
  - [0, 0]  # keyframe
  - [0, 0]
  - [0, 1]
  - [0, 2]
  - [0, 3]
  - [0, 4]
  - [0, 5]  # keyframe

runner_module: magicdrive.runner.multiview_t_runner.MultiviewTRunner

pipe_module: magicdrive.pipeline.pipeline_bev_controlnet_t.StableDiffusionBEVControlNetTPipeline

unet_module: magicdrive.networks.unet_2d_condition_multiview_t.UNet2DConditionModelMultiviewT
use_fp32_for_unet_trainable: true
# unet_dir: checkpoint-4/unet
# unet_dir: checkpoint-5000/unet
unet_dir: checkpoint-25000/checkpoint-60000/weight-E1-S19348/unet
lora_dir: lora.pt

unet:
  video_length: ${..video_length}
  temp_attn_type: t_last
  temp_pos_emb: learnable
  zero_module_type2: zero_linear
  spatial_trainable: false

  use_motion_module:          true
  motion_module_resolutions:  [1,2,4,8]
  motion_module_mid_block:    true
  motion_module_type:         "Vanilla"

  motion_module_kwargs:
    num_attention_heads:        8
    num_transformer_block:      1
    attention_block_types:      [ "Temporal_Self", "Temporal_Self" ]
    temporal_position_encoding: true
    temporal_attention_dim_div: 1
    zero_initialize:            true

model_module: magicdrive.networks.unet_addon_rawbox.BEVControlNetModel
controlnet_dir: controlnet
controlnet: {}

trainable_modules:
  - "motion_modules."
  - "attn1.to_q"