__include__: [
  '../../dataset/obj365_detection.yml',
  '../../runtime.yml',
  '../include/dataloader.yml',
  '../include/optimizer_obj365.yml',
  '../include/dfine_hgnetv2.yml',
]

output_dir: ../../../output/dfine_hgnetv2_x_obj365


DFINE:
  backbone: HGNetv2


HGNetv2:
  name: 'B5'
  return_idx: [1, 2, 3]
  freeze_stem_only: True
  freeze_at: 0
  freeze_norm: True

HybridEncoder:
  # intra
  hidden_dim: 384
  dim_feedforward: 2048

DFINETransformer:
  feat_channels: [384, 384, 384]
 
optimizer:
  type: AdamW
  params: 
    - 
      params: '^(?=.*backbone)(?!.*norm|bn).*$'
      lr: 0.000004
    - 
      params: '^(?=.*(?:encoder|decoder))(?=.*(?:norm|bn)).*$'
      weight_decay: 0.

  lr: 0.0004
  betas: [0.9, 0.999]
  weight_decay: 0.00005

epoches: 36 # Early stop

DFINECriterion:
  end_epoch: 36

train_dataloader: 
  dataset: 
    transforms:
      policy:
        epoch: 500
  collate_fn:
    stop_epoch: 500
    scale_ori_repeat: 3

ema:
  decay: 0.9998

DFINECriterion:
  weight_dict: {loss_vfl: 1, loss_bbox: 5, loss_giou: 2, loss_dfl: 0.1, loss_local: 1.0}

checkpoint_freq: 1