import argparse
import pandas as pd
from evaluator.MMBench_s import test_model_multiple
from Models.Qwen_VL_Chat_lora import QwenVLChatLora
from Models.InternVL2_Lora import InternVL2Lora
from Models.mPLUG_Lora import mPLUGLora
from utils.ECE import *
from utils.utils import *
import argparse
from main.Ask import get_model_class
from Models.ChatGPT_4o import GPT4o

def main(args):
    
    if 'qwen-vl-chat-lora' in args.model_path.lower():   
        model = QwenVLChatLora(args)
    elif 'work_dirs' in args.model_path.lower():
        model = InternVL2Lora(args)
    elif 'ms-swift' in args.model_path.lower():
        model = mPLUGLora(args)
    elif args.model_path == None:
        model = GPT4o(args)
    else:
        ModelClass = get_model_class(args.model_path)
        model = ModelClass(args)

    data = pd.read_parquet(args.data_path)
    test_model_multiple(model, args, repeat=3)

if __name__ == "__main__":
    parser = argparse.ArgumentParser(description="Accuracy of MMBench evaluation")
    parser.add_argument('--model_path', type=str,help="Path to the pre-trained or distilled model file. Specify the location of the model.")
    parser.add_argument('--device', type=str, default="cuda:0")
    parser.add_argument('--data_path', type=str, help="Path to the dataset.")
    parser.add_argument('--temperature', type=float, default=1.0)
    parser.add_argument('--num_test_samples', type=int, default=4329)
    parser.add_argument('--dataset_name', type=str, default="MMBench", help="Dataset Name, serve as savedir")
    parser.add_argument('--split', type=str, default="test",help="The Part of Dataset")
    parser.add_argument("--conv_mode", default="llava_llama_2",help="The system prompt of model")
    args = parser.parse_args()

    main(args)

  