#!/usr/bin/env bash
#
# Launches src/inference_time/predict_vllm.py on the viquae_mc dataset with the
# llava-hf/llava-v1.6-vicuna-13b-hf model, passing --greedy,
# --max_new_tokens 10, --method post_hoc and --conflict_prompt fixed, with
# --output_dir set to outputs/inference_time/viquae.
#
# Usage (run from the directory that contains src/, since every path below is
# relative to the current working directory):
#   bash <this-script> [extra predict_vllm.py arguments...]
#
# Any extra arguments are appended verbatim to the end of the command line.
# NOTE(review): whether a repeated flag overrides the earlier occurrence
# depends on predict_vllm.py's argument parser, which is not visible here.
#
# Environment:
#   CUDA_VISIBLE_DEVICES is unconditionally set to 4,5,6,7 below; edit that
#   line to run on different GPUs.

# Abort on command failure and on use of an unset variable. Kept to the
# POSIX subset (no pipefail) so the script also works under plain `sh`.
set -eu

# Limit the CUDA devices visible to the Python process to devices 4-7.
export CUDA_VISIBLE_DEVICES=4,5,6,7

# "$@" expands to nothing when the script is called without arguments, so the
# default invocation is unchanged.
python src/inference_time/predict_vllm.py \
    --dataset viquae_mc \
    --model_name llava-hf/llava-v1.6-vicuna-13b-hf \
    --greedy \
    --output_dir outputs/inference_time/viquae \
    --max_new_tokens 10 \
    --method post_hoc \
    --conflict_prompt fixed \
    "$@"
