 # Copyright (c) 2023, salesforce.com, inc.
 # All rights reserved.
 # SPDX-License-Identifier: BSD-3-Clause
 # For full license text, see the LICENSE file in the repo root or https://opensource.org/licenses/BSD-3-Clause

# Model section: `blip2_vicuna_xinstruct` architecture with the `vicuna7b`
# model type. Settings are declared per modality (image, pc, video, audio);
# only `image` is listed under `modalities` below.
model:
  arch: blip2_vicuna_xinstruct
  model_type: vicuna7b
  load_pretrained: true
  load_finetuned: false
  finetuned: ""
  stage1_url_or_filename: null

  # Encoder selected for each modality.
  image_model: "eva_clip_g"
  pc_model: "ulip2_pointbert"
  video_model: "eva_clip_g"
  audio_model: "beats"

  # Per-modality Q-Former checkpoint locations.
  pretrained_image_qformer: https://storage.googleapis.com/sfr-xinstructblip-data-research/model/xinstructblip_checkpoints/vicuna7b/image_pre_coco.pth
  pretrained_pc_qformer: https://storage.googleapis.com/sfr-xinstructblip-data-research/model/xinstructblip_checkpoints/vicuna7b/pc_qformer.pth
  pretrained_video_qformer: https://storage.googleapis.com/sfr-xinstructblip-data-research/model/xinstructblip_checkpoints/vicuna7b/video_qformer.pth
  pretrained_audio_qformer: https://storage.googleapis.com/sfr-xinstructblip-data-research/model/xinstructblip_checkpoints/vicuna7b/audio_qformer.pth

  # Checkpoint-loading switches, one set per modality.
  load_attention_image_qformer: true
  load_attention_pc_qformer: true
  load_attention_video_qformer: true
  load_attention_audio_qformer: true
  load_ln_type_image: "image"
  load_ln_type_video: "video"
  load_ln_type_pc: "pc"
  load_ln_type_audio: "audio"
  load_qformer_type_image: "image"
  load_qformer_type_pc: "pc"
  load_qformer_type_video: "video"
  load_qformer_type_audio: "audio"
  load_projection_image: true
  load_projection_pc: true
  load_projection_video: true
  load_projection_audio: true
  load_projection_type_image: "image"
  load_projection_type_pc: "pc"
  load_projection_type_video: "video"
  load_projection_type_audio: "audio"

  # Extra keyword arguments for each encoder ({} means none).
  image_encoder_kwargs:
    image_size: 224
    drop_path_rate: 0
    use_grad_checkpoint: false
  pc_encoder_kwargs: {}
  video_encoder_kwargs:
    image_size: 224
    drop_path_rate: 0
    use_grad_checkpoint: false
  audio_encoder_kwargs: {}

  # Precision and freeze flags per encoder.
  image_precision: "fp16"
  pc_precision: "fp16"
  video_precision: "fp16"
  audio_precision: "fp16"
  freeze_image: true
  freeze_pc: true
  freeze_video: true
  freeze_audio: true

  num_query_token: 32
  # Placeholder path: point this at the local Vicuna-7B weights before running.
  llm_model: /path/to/vicuna-7b
  prompt: a short description
  max_txt_len: 128
  max_output_txt_len: 256
  apply_lemmatizer: false
  num_few_shot_examples: 0
  few_shot_prob: 0
  qformer_text_input: true
  llm_text_input: true
  modalities: ["image"]
  use_cues: true

  # Shared Q-Former settings (disabled: `shared_qformer` is false).
  shared_qformer: false
  pretrained_shared_qformer: null
  load_attention_shared_qformer: false
  load_qformer_type_shared: ""
  load_projection_shared: false
  load_projection_type_shared: ""
  # NOTE(review): the key below looks like a misspelling of
  # `load_projection_type_shared` (all sibling keys end in `_shared`). It is
  # kept so anything reading the old name still finds a value; remove it once
  # confirmed unused.
  load_projection_type_shaped: ""
  load_ln_type_shared: ""
  shared_qformer_num_features: 512

  prefix: ""
  postfix: ""
  predict_with_gen: false

# Dataset section: one entry per dataset builder.
datasets:
  nocaps:  # dataset builder name
    # data_dir: ${env.data_dir}/datasets
    data_type: images  # one of: images | videos | features

    # Image preprocessing used for the train and eval splits.
    vis_processor:
      train:
        name: "clip_image_train"
        image_size: 224
      eval:
        name: "clip_image_eval"
        image_size: 224

    build_info:
      # Split names below are mapping keys. Do not prefix them with a minus
      # sign (-): that would turn them into list items.
      annotations:
        val:
          url: https://storage.googleapis.com/sfr-vision-language-research/datasets/nocaps_val.json
          storage: nocaps/annotations/nocaps_val.json
        test:
          url: https://storage.googleapis.com/sfr-vision-language-research/datasets/nocaps_test.json
          storage: nocaps/annotations/nocaps_test.json
      # Location of the image files.
      images:
        storage: /export/share/datasets/vision/nocaps/

# Run section: task, optimizer schedule, generation settings and runtime
# options for this job.
run:
  task: captioning

  # Optimizer and learning-rate schedule.
  # Exponent floats are written with a decimal point (1.0e-5, not 1e-5) so
  # YAML 1.1 resolvers also read them as floats rather than strings.
  lr_sched: "linear_warmup_cosine_lr"
  init_lr: 1.0e-5
  min_lr: 0
  warmup_lr: 1.0e-8
  warmup_steps: 1000
  weight_decay: 0.05
  max_epoch: 1
  batch_size_train: 16
  batch_size_eval: 8
  num_workers: 8
  accum_grad_iters: 1

  # Text generation settings.
  max_len: 80
  min_len: 10
  num_beams: 5
  inference_method: "generate"
  prompt: a short description
  length_penalty: 1.0

  annotation_file: https://nocaps.s3.amazonaws.com/nocaps_val_4500_captions.json

  seed: 42
  output_dir: "output/xinstructblip/eval/vicuna7b/image_pre_coco/nocaps_out_domain_captioning/"

  amp: true
  resume_ckpt_path: null

  evaluate: true
  # train_splits: ["train"]
  valid_splits: ["val"]

  # Device and distributed settings.
  device: "cuda"
  world_size: 1
  dist_url: "env://"
  distributed: true
  save_freq: -1  # save a checkpoint every N epochs; -1 keeps only the last and best
  val_freq: 1

  # Explicit list of integer image ids, in ascending order.
  # NOTE(review): presumably restricts evaluation to the nocaps out-of-domain
  # subset (see `output_dir`) — confirm against the consuming task.
  # Continuation lines are indented deeper than the key, as the YAML spec
  # requires for a flow sequence inside a block mapping.
  img_ids: [2, 4, 5, 8, 15, 18, 19, 22, 27, 30, 33, 35, 41, 42, 43, 46, 47, 51, 59, 60, 64, 65, 68, 69, 71, 72, 73, 77, 79, 81, 85, 87, 88, 90, 92, 100, 101, 102, 105, 107, 109, 115, 120, 124, 125, 126, 127, 129, 133, 135, 137, 139, 140, 141, 143, 150, 153, 155, 158, 164, 165, 167, 170, 171, 173, 182, 190, 191, 196, 200, 201, 203, 205, 208, 219, 225, 226, 228, 229, 232, 239, 240, 243, 245, 250, 262, 263, 264, 267, 272, 278, 283, 284, 290, 291, 297, 301, 304, 305, 309, 310, 311, 314, 323, 325, 329, 330, 331, 333, 334, 341, 349, 350, 351, 352, 354, 358, 359, 363, 365, 366, 368, 371, 372, 379, 381, 383, 386, 388, 389, 390, 392, 405, 415, 417, 418, 420, 421, 424, 428, 429, 432, 436, 441, 443, 452, 453, 454, 455, 456, 459, 464, 465, 468, 469, 476, 477, 478, 480, 487, 488, 490, 491, 493, 500, 502, 504, 506, 509, 510, 511, 512, 515, 516, 520, 527, 529, 533, 539, 540, 541, 544, 545, 547, 551, 554, 556, 559, 577, 579, 580, 582, 586, 587, 590, 593, 594, 607, 609, 616, 617, 619, 623, 628, 631, 634, 637, 648, 651, 654, 655, 665, 673, 678, 682, 684, 685, 688, 690, 695, 696, 701, 702, 705, 707, 708, 712, 714, 718, 719, 723, 725, 726, 730, 731, 733, 734, 740, 744, 748, 750, 751, 756, 757, 760, 761, 763, 767, 775, 779, 782, 783, 784, 787, 790, 792, 794, 798, 799, 802, 805, 807, 810, 812, 816, 818, 819, 820, 821, 829, 831, 836, 841, 842, 844, 845, 849, 850, 853, 854, 857, 859, 861, 868, 871, 874, 875, 877, 879, 886, 887, 889, 890, 891, 892, 893, 894, 896, 899, 900, 905, 918, 924, 926, 927, 929, 932, 934, 935, 943, 948, 950, 952, 953, 954, 956, 957, 963, 965, 969, 972, 973, 974, 976, 980, 985, 987, 988, 990, 992, 993, 994, 1000, 1001, 1003, 1005, 1009, 1013, 1016, 1018, 1019, 1020, 1021, 1022, 1024, 1028, 1029, 1033, 1036, 1037, 1038, 1042, 1045, 1046, 1050, 1053, 1054, 1056, 1065, 1072, 1076, 1079, 1082, 1083, 1096, 1101, 1103, 1107, 1112, 1117, 1129, 1132, 1133, 1136, 1138, 1141, 1143, 1155, 1157, 1160, 1164, 1165, 1166, 1172, 1175, 1179, 1183, 1194, 1197, 1200, 1202, 1210, 1228,
    1234, 1236, 1241, 1246, 1251, 1253, 1255, 1261, 1265, 1268, 1269, 1271, 1272, 1273, 1277, 1286, 1287, 1290, 1296, 1297, 1302, 1303, 1308, 1310, 1312, 1315, 1316, 1317, 1320, 1321, 1324, 1327, 1329, 1330, 1331, 1333, 1334, 1336, 1338, 1339, 1340, 1345, 1347, 1356, 1362, 1366, 1371, 1374, 1376, 1381, 1384, 1385, 1388, 1394, 1396, 1397, 1398, 1403, 1404, 1408, 1410, 1413, 1414, 1417, 1424, 1430, 1433, 1436, 1438, 1440, 1446, 1449, 1453, 1454, 1456, 1460, 1462, 1464, 1465, 1467, 1470, 1473, 1477, 1491, 1494, 1498, 1504, 1506, 1509, 1511, 1515, 1519, 1524, 1530, 1533, 1540, 1541, 1549, 1557, 1558, 1561, 1570, 1572, 1575, 1579, 1591, 1593, 1594, 1595, 1596, 1602, 1605, 1609, 1611, 1615, 1617, 1618, 1624, 1625, 1627, 1636, 1637, 1639, 1640, 1641, 1646, 1647, 1648, 1649, 1655, 1656, 1657, 1658, 1659, 1662, 1671, 1675, 1679, 1681, 1690, 1692, 1701, 1712, 1715, 1716, 1718, 1719, 1721, 1723, 1725, 1728, 1729, 1730, 1732, 1737, 1740, 1746, 1747, 1753, 1754, 1756, 1757, 1758, 1761, 1762, 1767, 1771, 1773, 1775, 1779, 1783, 1784, 1786, 1787, 1789, 1791, 1794, 1802, 1803, 1807, 1813, 1814, 1815, 1817, 1824, 1826, 1827, 1832, 1834, 1835, 1838, 1839, 1840, 1841, 1842, 1843, 1844, 1847, 1850, 1860, 1861, 1866, 1870, 1872, 1873, 1876, 1878, 1886, 1889, 1894, 1897, 1899, 1902, 1907, 1911, 1912, 1917, 1920, 1924, 1925, 1928, 1931, 1935, 1936, 1937, 1939, 1941, 1946, 1948, 1949, 1952, 1954, 1955, 1956, 1959, 1967, 1968, 1970, 1975, 1976, 1979, 1980, 1985, 1986, 1994, 1996, 1998, 2001, 2003, 2007, 2009, 2011, 2012, 2014, 2019, 2028, 2029, 2042, 2047, 2049, 2050, 2060, 2068, 2071, 2076, 2078, 2080, 2081, 2086, 2089, 2090, 2093, 2094, 2099, 2102, 2107, 2112, 2115, 2121, 2124, 2125, 2129, 2131, 2133, 2135, 2140, 2141, 2148, 2150, 2151, 2152, 2155, 2163, 2173, 2176, 2178, 2182, 2183, 2187, 2188, 2196, 2197, 2198, 2199, 2200, 2205, 2207, 2209, 2215, 2217, 2220, 2221, 2223, 2230, 2235, 2236, 2237, 2238, 2241, 2242, 2243, 2244, 2246, 2252, 2253, 2261, 2265, 2274, 2277, 2278, 2281, 2286, 2290,
    2292, 2293, 2294, 2296, 2299, 2301, 2304, 2305, 2307, 2309, 2312, 2314, 2315, 2319, 2323, 2324, 2337, 2338, 2339, 2340, 2342, 2351, 2356, 2358, 2360, 2367, 2369, 2371, 2374, 2376, 2378, 2382, 2383, 2387, 2388, 2390, 2399, 2400, 2412, 2416, 2422, 2423, 2427, 2428, 2435, 2439, 2440, 2442, 2447, 2450, 2455, 2459, 2461, 2462, 2463, 2466, 2468, 2470, 2479, 2480, 2482, 2483, 2485, 2488, 2491, 2495, 2496, 2502, 2505, 2506, 2507, 2510, 2511, 2515, 2522, 2524, 2532, 2534, 2546, 2547, 2550, 2554, 2558, 2562, 2563, 2574, 2583, 2584, 2590, 2594, 2598, 2602, 2603, 2606, 2611, 2613, 2615, 2617, 2619, 2623, 2625, 2630, 2636, 2642, 2643, 2644, 2646, 2647, 2649, 2650, 2659, 2661, 2664, 2674, 2675, 2677, 2682, 2684, 2685, 2691, 2693, 2695, 2698, 2699, 2703, 2704, 2706, 2707, 2711, 2713, 2719, 2720, 2723, 2726, 2727, 2729, 2730, 2733, 2734, 2738, 2739, 2741, 2744, 2745, 2748, 2749, 2754, 2757, 2761, 2762, 2764, 2765, 2767, 2768, 2772, 2776, 2778, 2779, 2780, 2781, 2783, 2787, 2791, 2795, 2796, 2799, 2800, 2802, 2807, 2808, 2811, 2813, 2817, 2820, 2827, 2829, 2831, 2833, 2834, 2835, 2839, 2840, 2841, 2846, 2847, 2849, 2852, 2855, 2859, 2860, 2864, 2870, 2871, 2876, 2878, 2879, 2882, 2884, 2885, 2886, 2887, 2888, 2895, 2896, 2897, 2898, 2900, 2902, 2905, 2911, 2913, 2915, 2919, 2922, 2924, 2933, 2939, 2945, 2953, 2954, 2958, 2959, 2968, 2973, 2976, 2979, 2982, 2984, 2992, 3002, 3004, 3007, 3008, 3009, 3010, 3013, 3016, 3021, 3022, 3023, 3026, 3028, 3033, 3036, 3037, 3039, 3043, 3044, 3045, 3046, 3053, 3060, 3062, 3063, 3071, 3072, 3085, 3086, 3092, 3095, 3096, 3102, 3103, 3104, 3105, 3111, 3115, 3116, 3122, 3129, 3131, 3132, 3137, 3138, 3140, 3147, 3148, 3157, 3164, 3167, 3168, 3170, 3175, 3179, 3182, 3184, 3190, 3194, 3196, 3198, 3199, 3200, 3215, 3216, 3217, 3219, 3222, 3229, 3230, 3237, 3239, 3242, 3249, 3253, 3255, 3257, 3258, 3267, 3270, 3271, 3274, 3279, 3288, 3290, 3291, 3293, 3299, 3305, 3306, 3312, 3318, 3319, 3320, 3323, 3326, 3328, 3329, 3335, 3343, 3344, 3345, 3347, 3349,
    3350, 3353, 3356, 3362, 3364, 3366, 3369, 3374, 3377, 3379, 3381, 3382, 3384, 3385, 3388, 3389, 3395, 3399, 3403, 3409, 3411, 3416, 3419, 3421, 3423, 3424, 3425, 3427, 3428, 3431, 3437, 3438, 3439, 3444, 3450, 3452, 3453, 3456, 3457, 3460, 3461, 3462, 3464, 3466, 3467, 3471, 3472, 3477, 3478, 3482, 3484, 3486, 3492, 3499, 3500, 3501, 3502, 3511, 3525, 3529, 3531, 3533, 3534, 3536, 3552, 3553, 3555, 3557, 3562, 3567, 3568, 3570, 3571, 3573, 3577, 3578, 3584, 3585, 3586, 3587, 3595, 3600, 3601, 3604, 3609, 3610, 3612, 3615, 3616, 3619, 3620, 3624, 3625, 3631, 3632, 3636, 3637, 3638, 3640, 3643, 3651, 3654, 3655, 3656, 3657, 3662, 3667, 3668, 3671, 3677, 3684, 3686, 3689, 3693, 3694, 3696, 3697, 3698, 3699, 3700, 3701, 3703, 3704, 3707, 3708, 3709, 3711, 3712, 3713, 3714, 3719, 3721, 3723, 3726, 3737, 3741, 3742, 3744, 3750, 3752, 3757, 3760, 3761, 3764, 3765, 3767, 3770, 3772, 3774, 3776, 3778, 3780, 3781, 3796, 3797, 3805, 3818, 3819, 3820, 3821, 3824, 3841, 3845, 3848, 3851, 3858, 3866, 3870, 3871, 3876, 3879, 3880, 3883, 3893, 3896, 3900, 3903, 3904, 3908, 3909, 3913, 3914, 3916, 3924, 3927, 3937, 3940, 3942, 3943, 3949, 3950, 3953, 3954, 3959, 3963, 3966, 3969, 3972, 3978, 3981, 3983, 3984, 3986, 3989, 3990, 3991, 3999, 4000, 4004, 4005, 4006, 4012, 4014, 4016, 4017, 4019, 4020, 4030, 4035, 4046, 4049, 4051, 4052, 4053, 4057, 4061, 4065, 4066, 4068, 4073, 4074, 4075, 4079, 4080, 4082, 4084, 4086, 4090, 4091, 4093, 4094, 4095, 4096, 4100, 4102, 4104, 4106, 4113, 4114, 4115, 4116, 4118, 4124, 4126, 4127, 4128, 4131, 4133, 4134, 4142, 4145, 4149, 4156, 4160, 4171, 4174, 4178, 4179, 4180, 4183, 4186, 4190, 4191, 4195, 4197, 4215, 4220, 4229, 4234, 4245, 4249, 4251, 4252, 4254, 4257, 4259, 4264, 4265, 4266, 4267, 4275, 4276, 4277, 4282, 4284, 4285, 4288, 4291, 4294, 4295, 4301, 4302, 4313, 4315, 4320, 4328, 4333, 4336, 4339, 4342, 4345, 4346, 4350, 4354, 4372, 4374, 4375, 4377, 4379, 4380, 4386, 4388, 4389, 4392, 4396, 4402, 4404, 4408, 4410, 4424, 4426, 4428, 4431,
    4435, 4436, 4439, 4442, 4446, 4447, 4449, 4452, 4455, 4458, 4460, 4461, 4466, 4469, 4475, 4476, 4478, 4488, 4491, 4494, 4498]
