name: 002_CFANet_Res50_cap
# name: debug_model
model_type: GeneralIQAModel 
num_gpu: 1  # set num_gpu: 0 for cpu mode
manual_seed: 123 

define: &img_size_oneside 224
define: &img_size [*img_size_oneside, *img_size_oneside]

define: &backbone resnet50

define: &train_batch_size 64
define: &test_batch_size 16

# dataset and data loader settings
datasets:
  train:
    name: lcy
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR_train.csv
    mos_range: [0, 5]
    lower_better: false 
    mos_normalize: true

    augment:
      hflip: true
      random_crop: 128
    img_range: 1

    # data loader
    use_shuffle: true
    num_worker_per_gpu: 16
    batch_size_per_gpu: 256
    dataset_enlarge_ratio: 1
    prefetch_mode: ~
    phase: train

  # val_0:
  #   name: All
  #   type: GeneralNRDataset
  #   dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
  #   meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_All.csv
  #   img_range: 1
  #   phase: val
  
  val_1:
    name: score1
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_score1.csv
    img_range: 1
    phase: val
  
  val_2:
    name: score2
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_score2.csv
    img_range: 1
    phase: val
  
  val_3:
    name: score3
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_score3.csv
    img_range: 1
    phase: val
  
  val_4:
    name: perspective_F
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_perspective_F.csv
    img_range: 1
    phase: val
  
  val_5:
    name: perspective_T
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_perspective_T.csv
    img_range: 1
    phase: val
  
  val_6:
    name: reality_R
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_reality_R.csv
    img_range: 1
    phase: val
  
  val_7:
    name: reality_S
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_reality_S.csv
    img_range: 1
    phase: val
  
  # val_8:
  #   name: Object_Daily
  #   type: GeneralNRDataset
  #   dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
  #   meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_Object_Daily.csv
  #   img_range: 1
  #   phase: val
  
  # val_9:
  #   name: Object_Industrial
  #   type: GeneralNRDataset
  #   dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
  #   meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_Object_Industrial.csv
  #   img_range: 1
  #   phase: val
  
  val_10:
    name: dis-level_S4
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_dis-level_S4.csv
    img_range: 1
    phase: val
  
  val_11:
    name: dis-level_S5
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_dis-level_S5.csv
    img_range: 1
    phase: val
  
  val_12:
    name: dis-level_S6
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_dis-level_S6.csv
    img_range: 1
    phase: val
  
  val_13:
    name: dis-level_S7
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_dis-level_S7.csv
    img_range: 1
    phase: val
  
  val_14:
    name: dis-level_S8
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_dis-level_S8.csv
    img_range: 1
    phase: val

  # val_15:
  #   name: cross-vlm
  #   type: GeneralNRDataset
  #   dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_distorted_all
  #   meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_vlm.csv
  #   img_range: 1
  #   phase: val

  # val_16:
  #   name: cross-tid
  #   type: GeneralNRDataset
  #   dataroot_target: /tos-bjml-researcheval/wenfarong/dataset/tid2013/distorted_images
  #   meta_info_file: /tos-bjml-researcheval/wenfarong/dataset/tid2013/NR_mos_with_names_tiny_0-5.csv
  #   img_range: 1
  #   phase: val


  # val_17:
  #   name: cross-live
  #   type: GeneralNRDataset
  #   dataroot_target: /tos-bjml-researcheval/wenfarong/dataset/live
  #   meta_info_file: /tos-bjml-researcheval/wenfarong/dataset/live/NR_filename_mos_half_0-5.csv
  #   img_range: 1
  #   phase: val

  val_18:
    name: bottom_50
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_bottom_50.csv
    img_range: 1
    phase: val

  val_19:
    name: middle_50
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_middle_50.csv
    img_range: 1
    phase: val

  val_20:
    name: top_50
    type: GeneralNRDataset
    dataroot_target: /fs-computility/ResearchEval/shared/xiaojiahao/MY_DATA_1000_all
    meta_info_file: /fs-computility/ResearchEval/xiaojiahao/project/vlm_meta_info/vlm_meta_info_sampled/NR/NR_top_50.csv
    img_range: 1
    phase: val

# network structures
network:
  type: CFANet 
  use_ref: false
  pretrained: false
  num_crop: 1 
  num_attn_layers: 1
  crop_size: 128
  semantic_model_name: *backbone
  block_pool: weighted_avg

# path
path:
  strict_load_g: true
  resume_state: ~
  experiments_root: /fs-computility/ResearchEval/xiaojiahao/models/IQA-PyTorch/experiments/001_frAHIQ
  models: /fs-computility/ResearchEval/xiaojiahao/models/IQA-PyTorch/experiments/001_frAHIQ/models
  training_states: /fs-computility/ResearchEval/xiaojiahao/models/IQA-PyTorch/experiments/001_frAHIQ/training_states
  log: /fs-computility/ResearchEval/xiaojiahao/models/IQA-PyTorch/experiments/001_frAHIQ
  visualization: /fs-computility/ResearchEval/xiaojiahao/models/IQA-PyTorch/experiments/001_frAHIQ/visualization


# training settings
train:
  optim:
    type: AdamW
    lr: !!float 3e-5 
    weight_decay: !!float 1e-5
  
  scheduler:
    type: CosineAnnealingLR
    T_max: 50 
    eta_min: 0 
    # type: StepLR 
    # step_size: !!float 1e9
    # gamma: 1.0 

  total_iter: 50000
  total_epoch: 20
  warmup_iter: -1  # no warm up
  
  # losses
  mos_loss_opt:
    type: MSELoss 
    loss_weight: !!float 1.0

  metric_loss_opt:
    type: NiNLoss 
    loss_weight: !!float 1.0

# validation settings
val:
  val_freq: !!float 200 
  save_img: false
  pbar: true

  key_metric: srcc # if this metric improve, update all metrics. If not specified, each best metric results will be updated separately 
  metrics:
    srcc: 
      type: calculate_srcc

    plcc: 
      type: calculate_plcc
    
    krcc:
      type: calculate_krcc

# logging settings
logger:
  print_freq: 10
  save_latest_freq: !!float 500 
  log_imgs_freq: 1000
  use_tb_logger: true
  wandb:
    project: ~
    resume_id: ~

# dist training settings
dist_params:
  backend: nccl
  port: 29500

find_unused_parameters: True
dist: False
rank: 0
world_size: 1
auto_resume: False
is_train: True
root_path: /fs-computility/ResearchEval/xiaojiahao/models/IQA-PyTorch
