project_name: v2i_fusion # This is used for logging into wandb
name: LiDAR-only

dataset: &dataset 'V2XSim' # V2XReal or V2XSim
root_dir: "/media/user/Dataset/V2X-Sim-Reformat/train"
validate_dir: "/media/user/Dataset/V2X-Sim-Reformat/test"
dataset_mode: 'v2i' # 'ic' or 'v2i'
img_format: 'npy' # 'jpeg' or 'npy'
modality:
  rsu_lidar: true
  rsu_camera: false
  cav_lidar: true
  cav_camera: false

yaml_parser: "load_bev_params"
train_params:
  batch_size: &batch_size 1
  epoches: &epoches 80
  eval_freq: 4
  save_freq: 1
  max_cav: &max_cav 3

fusion:
  core_method: 'IntermediateFusionDatasetV2XSim' # IntermediateFusionDatasetV2XReal, IntermediateFusionDatasetV2XSim
  args: []

# preprocess-related
preprocess:
  # options: BasePreprocessor, BevPreprocessor
  core_method: 'BevPreprocessor'
  args:
    res: &res 0.15 # discretization resolusion
    downsample_rate: &downsample_rate 4 # pixor downsample ratio
    bgr2rgb: true
    resize_x: &image_width 512
    resize_y: &image_height 512
    mean: [ 0.485, 0.456, 0.406 ]
    std: [ 0.229, 0.224, 0.225 ]
    voxel_size: &voxel_size [0.4, 0.4, 30]
  # lidar range for each individual cav.
  cav_lidar_range: &cav_lidar [ -38.4, -38.4, -10, 38.4, 38.4, 2 ]

data_augment: []

# anchor box related
postprocess:
  core_method: 'BevPostprocessor' # BevPostprocessor supported
  nms_thresh: 0.15
  anchor_args:
    cav_lidar_range: *cav_lidar
    res: *res
    downsample_rate: *downsample_rate # pixor downsample ratio
  target_args:
    score_threshold: 0.5
  order: 'lwh' # hwl or lwh
  max_num: 300 # maximum number of objects in a single frame. use this number to make sure different frames has the same dimension in the same batch

# model related
model:
  core_method: pixor_intermediate # rsu_modality_intermediate_plainfuse, cam_intermediate_fuse_single, pixor_intermediate

  args:
    dataset: *dataset
    header:
      dataset: *dataset
      feature_dim: 128
      use_bn: False
      decoder:
        input_dim: 128
        num_layer: 1
        num_ch_dec: [ 64 ]
      seg_dim:
        64
    decode: False
    point_pillar_scatter:
      num_features: 64

loss:
  core_method: segment_focal_loss
  args:
    gamma: 1.0 # 2.0
    seg_weight: 2.0

optimizer:
  core_method: AdamW
  lr: 2e-4 #0.0002
  args:
    eps: 1e-10 #1e-10
    weight_decay: 1e-2

lr_scheduler:
  core_method: cosineannealwarm #step, multistep, cosineannealwarm and Exponential support
  epoches: *epoches
  warmup_lr: 2e-5
  warmup_epoches: 10
  lr_min: 5e-6
