

# Launch src/Inference/infer_llama_vllm_truthfulqa.py against the
# llama-2-7b-chat-hf checkpoint, exposing only CUDA device 1 to the process.
#
# The script path is relative, so it is resolved against the current working
# directory; the model, prompt, and output locations are absolute.
#
# NOTE(review): the meaning of each flag is defined by the Python script, which
# is not visible here. The output file name suggests 10 responses per prompt
# sampled at top_p 1.0 -- confirm against the script's argument parser.

# Shared parent directory of the prompt CSV and the results file.
data_root=/data/huanghj/Contrastive/Idk_datasets/sft_data
model_dir=/data/share/models/llama-2-7b-chat-hf
questions_csv="${data_root}/TruthfulQA.csv"
results_json="${data_root}/llama-2-7b-chat/truthfulqa_test_tp1.0_10responses_with_em_labels.json"

CUDA_VISIBLE_DEVICES=1 python src/Inference/infer_llama_vllm_truthfulqa.py \
  --model_name "${model_dir}" \
  --batch_size 8 \
  --save_name "${results_json}" \
  --prompt_file "${questions_csv}" \
  --response_num 10 \
  --top_p 1.0 \
  --top_k -1 \
  --temperature 0.7 \
  --tensor_parallel_size 1