#!/usr/bin/env bash
# Launches llava.eval.model_vqa_loader against the CGUB "attack-on-cat"
# checkpoint, passing generation settings and the output locations for the
# answers file and the metrics file.
#
# All paths beginning with ./ are resolved against the current working
# directory, so invoke this script from the directory that contains ./cgub
# and ./checkpoints.
#
# The script's exit status is the exit status of the python command, which is
# the last command executed.
#
# NOTE(review): --question_file and --image_folder point at "coco" paths while
# the task name and --coco_gt_file refer to flickr8k. Left unchanged here;
# confirm that this mix is intended.

task=Eval_CGUB_cat_on_flickr8k

# Both output files are placed in the same per-task directory.
out_dir="./checkpoints/EVAL/${task}"

# Timestamp suffix gives each run its own answers file; the metrics path has no
# timestamp, so it is the same on every run.
run_stamp="$(date +%Y%m%d_%H%M%S)"

# Every continuation line ends in " \" and the final argument has no trailing
# backslash, so nothing written after this command can be absorbed into it.
python -m llava.eval.model_vqa_loader \
    --model_base liuhaotian/llava-v1.5-7b \
    --model_path ./cgub/checkpoints/flickr8k/attack/llava-v1.5-7b-cgub-attack-on-cat \
    --concept_path ./cgub/checkpoints/flickr8k/llava-v1.5-concept-100/concept.bin \
    --question_file ./cgub/data/eval/coco/test.jsonl \
    --image_folder /pretrained/lavis_cache/coco/images \
    --temperature 1 \
    --conv-mode vicuna_v1 \
    --coco_gt_file /pretrained/lavis_cache/flickr8k/flickr8k_caption_gt/flickr8k_caption_test_gt.json \
    --answers_file "${out_dir}/result_${run_stamp}.json" \
    --save_path "${out_dir}/metrics.json" \
    --gpu 0 \
    --max_new_tokens 30 \
    --min_new_tokens 8 \
    --num_beams 5 \
    --top_p 0.9
