# Download pre-trained weights for image captioning (CLIP-CAP and BLIP)
# Fetch the CLIP-CAP COCO checkpoint with gdown and place it under
# external/clipcap/. Every step is checked explicitly so that a failed
# install or download stops here with a clear message instead of falling
# through to a confusing "No such file" error from mv.
pip install gdown || {
  echo "error: failed to install gdown" >&2
  exit 1
}

# The target directory may be missing on a fresh checkout; without it the
# final mv would fail.
mkdir -p external/clipcap || {
  echo "error: cannot create external/clipcap" >&2
  exit 1
}

# The argument is the file ID passed to gdown; the download is expected to
# land in the current directory as clip_cap_coco_weight.pt.
gdown 1ocKr2gWCx20QRykqxCddhTwiXaEnRLS_ || {
  echo "error: download of clip_cap_coco_weight.pt failed" >&2
  exit 1
}

mv -- clip_cap_coco_weight.pt external/clipcap/ || {
  echo "error: cannot move clip_cap_coco_weight.pt into external/clipcap/" >&2
  exit 1
}