# Base config referenced by this file. Presumably it is loaded first and the
# keys below override it -- confirm against the config loader.
includes: projects/task/test_vtt.yaml
# Model settings: class names for the top-level model and its encoders.
model:
  model_cls: MMFusionSeparate
  # Explicitly null: no class is configured for the multimodal encoder here.
  # (Presumably unused because video and text have their own encoders below;
  # confirm against the model code.)
  mm_encoder_cls: null
  video_encoder_cls: MMBertForEncoder
  text_encoder_cls: BertModel
  # Presumably the number of hidden layers in the video encoder -- confirm
  # against the model code.
  num_hidden_video_layers: 6
# Evaluation settings.
eval:
  # Presumably the location where evaluation output is written -- confirm
  # against the evaluation code.
  save_path: runs/task/vtt_zs/eval
# Options grouped under the `fairseq` key.
fairseq:
  # TODO: read the consuming code and confirm which option names the
  # checkpoint to load; `common_eval.path` below is assumed to be it.
  common_eval:
    path: runs/task/checkpoint_best.pt
