# Data sampling and preprocessing settings. The exact meaning of each key is
# defined by the code that loads this file; notes below only describe what is
# visible in this config.
DATA:
  MAX_SAMPLE_INTERVAL: 400
  # Per-channel normalization constants, three values each. The numbers match
  # the widely used ImageNet RGB mean/std.
  MEAN: [0.485, 0.456, 0.406]
  STD: [0.229, 0.224, 0.225]
  # Search-region crop settings.
  SEARCH:
    CENTER_JITTER: 4.5
    FACTOR: 5.0
    SCALE_JITTER: 0.5
    SIZE: 384
    NUMBER: 2
  # Template crop settings; both jitter values are zero here.
  TEMPLATE:
    CENTER_JITTER: 0
    FACTOR: 2.0
    SCALE_JITTER: 0
    SIZE: 192
    NUMBER: 3
  TOKENFD_SIZE: 448

  TRAIN:
    # Active training datasets. Commented-out entries are disabled
    # alternatives kept for reference.
    DATASETS_NAME:
    # - LASOT
    # - GOT10K_vottrain
    # - COCO17
    # - TRACKINGNET
    - ARTVIDEOSOT_TRAIN
    - DSTEXTSOT_TRAIN
    - BOVTEXTSOT_TRAIN
    # Three active ratios for the three active datasets above (presumably
    # paired by position; confirm against the loader before re-enabling any
    # commented-out dataset).
    DATASETS_RATIO:
    - 1
    - 1
    - 1
    # - 1
    # - 1
    SAMPLE_PER_EPOCH: 30000
  VAL:
    # Active validation datasets, listed in the same order as the training
    # datasets above.
    DATASETS_NAME:
    # - GOT10K_votval
    - ARTVIDEOSOT_VAL
    - DSTEXTSOT_VAL
    - BOVTEXTSOT_VAL
    DATASETS_RATIO:
    # - 1
    - 1
    - 1
    - 1
    SAMPLE_PER_EPOCH: 5000
# Model architecture settings. Booleans use the canonical lowercase
# `true`/`false` spelling, matching the TEST section of this file.
MODEL:
  # Empty string: no pretrained weights file is named in this config.
  PRETRAIN_FILE: ""
  TEXT_BACKBONE:
    # Empty string: no text-backbone checkpoint is named in this config.
    CHECKPOINT: ""
  FUSION:
    EMBED_DIM: 256
    NUM_HEADS: 8
  EXTRA_MERGER: false
  RETURN_INTER: false
  BACKBONE:
    TYPE: vit_base_patch16_224_ce
    STRIDE: 16
    # CE_LOC and CE_KEEP_RATIO each have three entries (presumably paired by
    # position; confirm against the backbone code).
    CE_LOC: [3, 6, 9]
    CE_KEEP_RATIO: [0.7, 0.7, 0.7]
    CE_TEMPLATE_RANGE: 'CTR_POINT'
    ADD_CLS_TOKEN: true
    ATTN_TYPE: concat
  HEAD:
    TYPE: CENTER
    # Same value as FUSION.EMBED_DIM above.
    NUM_CHANNELS: 256

# Optimization and training-loop settings. Booleans use the canonical
# lowercase `true`/`false` spelling, matching the TEST section of this file.
TRAIN:
  BBOX_TASK: true
  BACKBONE_MULTIPLIER: 0.1
  DROP_PATH_RATE: 0.1
  BATCH_SIZE: 4
  NUM_WORKER: 10
  # LR_DROP_EPOCH (240) falls before the final EPOCH (300).
  EPOCH: 300
  LR_DROP_EPOCH: 240
  # Loss-term weights.
  GIOU_WEIGHT: 2.0
  L1_WEIGHT: 5.0
  GRAD_CLIP_NORM: 0.1
  LR: 0.0001
  OPTIMIZER: ADAMW
  PRINT_INTERVAL: 50
  SCHEDULER:
    TYPE: step
    DECAY_RATE: 0.1
  VAL_EPOCH_INTERVAL: 2
  WEIGHT_DECAY: 0.0001
  AMP: false
  # Empty string: no fine-tuning source is named in this config.
  FINETUNE_FROM: ""
  
# Inference-time settings.
TEST:
  # Same value as TRAIN.EPOCH in this file.
  EPOCH: 300
  # Crop geometry; these values equal DATA.SEARCH / DATA.TEMPLATE
  # (FACTOR, SIZE, NUMBER) in this file.
  SEARCH_FACTOR: 5.0
  SEARCH_SIZE: 384
  TEMPLATE_FACTOR: 2.0
  TEMPLATE_SIZE: 192
  TEMPLATE_NUMBER: 3
  MEMORY_THRESHOLD: 1000
  # Multi-scale options; SCALE_FACTORS lists three scales centred on 1.0.
  USE_GATED_MS: true
  SCALE_FACTORS: [0.95, 1.0, 1.05]
  UNCERTAINTY_THRESHOLD: 0.98
  # Kalman-related options.
  USE_KALMAN: true
  KALMAN_ALPHA: 0.5
