__include__: [
  '../../dataset/obj365_detection.yml',
  '../../runtime.yml',
  '../include/dataloader.yml',
  '../include/optimizer_obj365.yml',
  '../include/dfine_hgnetv2.yml',
]

output_dir: ../../../output/dfine_hgnetv2_s_obj365


DFINE:
  backbone: HGNetv2


HGNetv2:
  name: 'B0'
  return_idx: [1, 2, 3]
  freeze_at: -1
  freeze_norm: False
  use_lab: True

DFINETransformer:
  num_layers: 3
  eval_idx: -1

HybridEncoder:
  in_channels: [256, 512, 1024]
  hidden_dim: 256
  depth_mult: 0.34
  expansion: 0.5
  
optimizer:
  type: AdamW
  params: 
    - 
      params: '^(?=.*backbone)(?!.*norm|bn).*$'
      lr: 0.0002
    - 
      params: '^(?=.*backbone)(?=.*norm|bn).*$'
      lr: 0.0002
      weight_decay: 0.
    - 
      params: '^(?=.*(?:encoder|decoder))(?=.*(?:norm|bn|bias)).*$'
      weight_decay: 0.

  lr: 0.0004
  betas: [0.9, 0.999]
  weight_decay: 0.00005

epoches: 36 # Early stop

DFINECriterion:
  end_epoch: 36

train_dataloader: 
  dataset: 
    transforms:
      policy:
        epoch: 500
  collate_fn:
    stop_epoch: 500
    scale_ori_repeat: 10

ema:
  decay: 0.9998

DFINECriterion:
  weight_dict: {loss_vfl: 1, loss_bbox: 5, loss_giou: 2, loss_dfl: 0.1, loss_local: 1.0}

checkpoint_freq: 1