model:
  NAME: PTSegV3_Balance_Main
  in_channels: 6
  enable_hefm: False
  use_prev_softmax_guidance: True
  beta: 0.999 # 0.999
  grid_size: 0.02
  num_classes_per_level: [4, 13]
  encoder_kwargs:
    enable_flash: False      # 关闭 Flash-Attention，以便启用 RPE
    enable_rpe:   True       # 相对位置偏置
    upcast_attention: True   # q,k 点积用 fp32，提高数值稳定性
    enc_patch_size: [128, 128, 128, 128, 128]
    dec_patch_size: [128, 128, 128, 128]
    upcast_softmax: True
model_prior:
  NAME: PTSegV3_Balance_Prior
  in_channels: 6
  beta: 0.999
  grid_size: 0.02
  encoder_kwargs:
    enable_flash: False
    enable_rpe:   True
    upcast_attention: True
    enc_patch_size: [128, 128, 128, 128, 128]
    dec_patch_size: [128, 128, 128, 128]
    upcast_softmax: True

prior_active: [0, 1]
epochs: 100
batch_size: 64 # 2 for PTv2; 4 for PTv1

dataset:
  common:
    NAME: Urban3DSegBase
    cfg_dir: /root/autodl-tmp/PointSegBase-main/configs/pointnet_urban_layer_all
    set_name: TRAIN
  train:
    set_name: TRAIN
  val:
    set_name: VALIDATION
  test:
    set_name: TEST

dataloader:
  num_workers: 16

datatransforms: {}

criterion:
  NAME: CrossEntropy
  label_smoothing: 0.2
criterion_SupCon:
  NAME: SupConLoss
  temperature: 0.07
consistency_loss:
  enable: False
  matrices_file: /root/autodl-tmp/PointSegBase-main/configs/pointnet_urban_layer_all/data_list/matrix_file_list.yaml
  mode: inter
  weight: 1.0

optimizer:
  NAME: 'adamw'  # performs 1 point better than adam
  weight_decay: 0.05

# lr_scheduler2:
sched: cosine
warmup_epochs: 0
min_lr: 1.0e-5
lr: 0.0002  # start LR (= first max_lr / div_factor)

sched_params:
  max_lr: [0.002, 0.0002]
  pct_start: 0.05
  anneal_strategy: cos
  div_factor: 10.0
  final_div_factor: 1000.0

# loss_weight
loss_prior: 1.0
loss_prior_supcon: 1.0
loss_main_l1: 1.0
loss_main_ce: 1.0
