#!/bin/bash
# Launches `python -m vlm_eval.run_evaluation` with --eval_textvqa for the
# open_flamingo model, using the ensemble attack settings listed below.
#
# Usage:
#   ./this_script.sh [extra run_evaluation arguments...]
#
# Optional environment overrides (defaults reproduce the original command):
#   VLM_EVAL_ROOT  directory that holds all checkpoints, models and datasets
#   VLM_EVAL_GPU   value exported as CUDA_VISIBLE_DEVICES (default: 3)
#
# Any arguments given to this script are appended verbatim after the built-in
# ones; how duplicates are resolved is up to run_evaluation's argument parser.
set -euo pipefail

# Single source of truth for the storage root that every path below shares.
readonly root="${VLM_EVAL_ROOT:-/inspire/hdd/global_user/usr-240108540162}"
readonly gpu="${VLM_EVAL_GPU:-3}"

# Sub-directories referenced by more than one argument.
readonly flamingo_dir="${root}/RobustVLM-HF-4090/open_flamingo"
readonly mpt_dir="${root}/mpt-7b"
readonly bench_dir="${root}/eval_benchmark"
readonly coco_dir="${root}/COCO"
readonly flickr_dir="${root}/flickr30k"
readonly vizwiz_dir="${root}/vizwiz"

# Argument order is kept identical to the original command line.
args=(
  # Task selection and attack settings.
  --eval_textvqa
  --attack ensemble --eps 2 --steps 100 --mask_out context
  --vision_encoder_pretrained "${root}/RobustVLM/output/ViT-L-14_imagenet_l2_pgd_fintune_strength2-Template1_42_0_U0Zs2/checkpoints/final.pt"

  # Run size and output location.
  --num_samples 100
  --shots 0
  --batch_size 1
  --results_file res9B
  --model open_flamingo
  --out_base_path "${flamingo_dir}/output-Sr2"

  # Model components.
  --vision_encoder_path "${root}/offline/clip-vit-large-patch14"
  --checkpoint_path "${flamingo_dir}/OpenFlamingo-9B-vitl-mpt7b/checkpoint.pt"
  --lm_path "${mpt_dir}"
  --lm_tokenizer_path "${mpt_dir}"
  --precision float16
  --cross_attn_every_n_layers 4

  # COCO paths.
  --coco_train_image_dir_path "${coco_dir}/train2014"
  --coco_val_image_dir_path "${coco_dir}/val2014"
  --coco_karpathy_json_path "${bench_dir}/mscoco_karpathy/karpathy_coco.json"
  --coco_annotations_json_path "${bench_dir}/mscoco_karpathy/annotations/captions_val2014.json"

  # Flickr30k paths.
  --flickr_image_dir_path "${flickr_dir}/flickr30k-images"
  --flickr_karpathy_json_path "${flickr_dir}/Annotations/karpathy_flickr30k.json"
  --flickr_annotations_json_path "${flickr_dir}/Annotations/dataset_flickr30k_coco_style.json"

  # VizWiz paths (the "test" arguments point at the val files).
  --vizwiz_train_image_dir_path "${vizwiz_dir}/train"
  --vizwiz_test_image_dir_path "${vizwiz_dir}/val"
  --vizwiz_train_questions_json_path "${vizwiz_dir}/train_questions_vqa_format.json"
  --vizwiz_train_annotations_json_path "${vizwiz_dir}/train_annotations_vqa_format.json"
  --vizwiz_test_questions_json_path "${vizwiz_dir}/val_questions_vqa_format.json"
  --vizwiz_test_annotations_json_path "${vizwiz_dir}/val_annotations_vqa_format.json"

  # VQAv2 paths (images come from the COCO directories).
  --vqav2_train_image_dir_path "${coco_dir}/train2014"
  --vqav2_train_questions_json_path "${bench_dir}/vqav2/v2_OpenEnded_mscoco_train2014_questions.json"
  --vqav2_train_annotations_json_path "${bench_dir}/vqav2/v2_mscoco_train2014_annotations.json"
  --vqav2_test_image_dir_path "${coco_dir}/val2014"
  --vqav2_test_questions_json_path "${bench_dir}/vqav2/v2_OpenEnded_mscoco_val2014_questions.json"
  --vqav2_test_annotations_json_path "${bench_dir}/vqav2/v2_mscoco_val2014_annotations.json"

  # TextVQA paths (the "test" arguments point at the val files).
  --textvqa_image_dir_path "${root}/textvqa/train_images"
  --textvqa_train_questions_json_path "${bench_dir}/textvqa/train_questions_vqa_format.json"
  --textvqa_train_annotations_json_path "${bench_dir}/textvqa/train_annotations_vqa_format.json"
  --textvqa_test_questions_json_path "${bench_dir}/textvqa/val_questions_vqa_format.json"
  --textvqa_test_annotations_json_path "${bench_dir}/textvqa/val_annotations_vqa_format.json"
)

# The script's exit status is that of the python process (last command).
CUDA_VISIBLE_DEVICES="${gpu}" python -m vlm_eval.run_evaluation "${args[@]}" "$@"