{
  "model": {
    "model_cls": "VideoChat2_it",
    "vit_blip_model_path": "xxx/umt_l16_qformer.pth",
    "llama_model_path": "xxx/vicuna-7b-v0",
    "videochat2_model_path": "xxx/videochat2_7b_stage2.pth",
    "freeze_vit": false,
    "freeze_qformer": false,
    "max_txt_len": 512,
    "low_resource": false,
    "vision_encoder": {
      "name": "vit_l14",
      "img_size": 224,
      "patch_size": 16,
      "d_model": 1024,
      "encoder_embed_dim": 1024,
      "encoder_depth": 24,
      "encoder_num_heads": 16,
      "drop_path_rate": 0.0,
      "num_frames": 32,
      "tubelet_size": 1,
      "use_checkpoint": false,
      "checkpoint_num": 0,
      "pretrained": "",
      "return_index": -2,
      "vit_add_ln": true,
      "ckpt_num_frame": 4
    },
    "num_query_token": 32,
    "qformer_hidden_dropout_prob": 0.1,
    "qformer_attention_probs_dropout_prob": 0.1,
    "qformer_drop_path_rate": 0.2,
    "extra_num_query_token": 64,
    "qformer_text_input": true,
    "system": "",
    "start_token": "<Video>",
    "end_token": "</Video>",
    "img_start_token": "<Image>",
    "img_end_token": "</Image>",
    "random_shuffle": true,
    "use_lora": false,
    "lora_r": 16,
    "lora_alpha": 32,
    "lora_dropout": 0.1
  },
  "device": "cuda"
}
