import json
from tqdm import tqdm
import random
from datasets import load_dataset
import ast
from swift.llm import (
        get_model_tokenizer, get_template, inference, ModelType,
        get_default_template_type, inference_stream
    )
from swift.utils import seed_everything
import logging
from .utils import *

def extract_options(options_str):
    """Parse the textual ``options`` field of a record into a list.

    Args:
        options_str: Normally a string holding a Python literal such as
            ``"['cat', 'dog']"``. A list or tuple that has already been
            parsed is accepted too and returned as a new list, so calling
            this twice on the same record does not discard the options.

    Returns:
        The value produced by ``ast.literal_eval`` for string input, a list
        copy for list/tuple input, or ``[]`` when the input cannot be parsed
        (a diagnostic line is printed in that case).
    """
    # Already-parsed sequences would make literal_eval raise ValueError and
    # be replaced by [], so hand them back untouched.
    if isinstance(options_str, (list, tuple)):
        return list(options_str)

    try:
        options = ast.literal_eval(options_str)
    except (SyntaxError, ValueError, TypeError):
        # TypeError covers literals that are syntactically valid but cannot
        # be built, e.g. a dict literal with an unhashable key.
        print(f"Error parsing options: {options_str}")
        options = []
    return options

# Option letters assigned, in order, to the parsed options of each question.
_MMMU_OPTION_LABELS = ('A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I', 'J')


def _mmmu_dump_json(records, save_path):
    """Write ``records`` to ``save_path`` as indented UTF-8 JSON and close the file."""
    with open(save_path, 'w', encoding='utf-8') as handle:
        json.dump(records, handle, indent=2, ensure_ascii=False)


def _mmmu_base_prompt(question, choices, answer):
    """Build the plain prompt; ``answer`` is accepted only to share a signature."""
    return construct_query_base_MC(question, choices)


def _mmmu_answer_prompt(question, choices, answer):
    """Build the prompt that passes the record's reference answer as third argument."""
    return construct_query_MC(question, choices, answer)


def _mmmu_random_prompt(question, choices, answer):
    """Build the prompt that passes the result of ``select_random_choice``."""
    # NOTE(review): select_random_choice presumably returns an option other
    # than ``answer``; its definition is not visible here - confirm in utils.
    return construct_query_MC(question, choices, select_random_choice(answer, len(choices)))


def _mmmu_run_round(args, model, template, items, desc, build_prompt):
    """Query the model once per item and return one result record per item.

    ``build_prompt(question, choices, answer)`` produces the prompt text. The
    prompt is built immediately before the model call of the same item, so
    any random draws interleave with inference exactly as in a plain loop.
    """
    # Imported here so the block does not rely on ``os`` leaking in through
    # the star import from ``.utils``.
    import os

    records = []
    for item in tqdm(items, desc=desc):
        # Read every field up front so a malformed record fails before any
        # model call is spent on it.
        index = item["index"]
        question = item["question"]
        question_type = item["question_type"]
        choices = item['choices']
        answer = item["answer"]
        img_type = item["img_type"]
        topic_difficulty = item["topic_difficulty"]
        subfield = item["subfield"]

        prompt = build_prompt(question, choices, answer)
        image = os.path.join(args.local_image_path, index) + '.jpg'

        if args.api_model:
            response_temp = get_all_model_api_result(args, prompt, image)
        elif args.model_type == 'phi3-vision-128k-instruct':
            # This model type gets the image path embedded in the prompt
            # instead of the ``images`` argument; the stored prompt keeps it.
            prompt = f'<img>{image}</img>{prompt}'
            # ``tempeature`` (sic) is the attribute name this code reads from args.
            response_temp, _ = inference(model, template, prompt, temperature=args.tempeature)
        else:
            response_temp, _ = inference(model, template, prompt, images=image,
                                         temperature=args.tempeature)

        response = extract_option(response_temp, question)
        records.append({
            'index': index,
            'question': question,
            'question_type': question_type,
            'choices': choices,
            'answer': answer,
            'response': response,
            'response_temp': response_temp,
            'img_type': img_type,
            'topic_difficulty': topic_difficulty,
            'subfield': subfield,
            'prompt': prompt,
        })
    return records


def MMMU_val(args,val_data, model, template ):
    """Run the multiple-choice evaluation rounds over ``val_data``.

    Steps, in order:

    1. Seed with 42, point ``args.local_image_path`` at the fixed image
       directory, keep only ``'multiple-choice'`` records, rename ``id`` to
       ``index`` and map the parsed options onto letters ``A``..``J``.
    2. Query the model with the base prompt for every record, save the
       results under the ``'all'`` tag and pass them to
       ``calculate_consistency_MC``.
    3. Split the results into records whose extracted response equals the
       reference answer and records whose response differs; records whose
       response is ``-2`` go to neither group. Save both groups
       (``'all_false'``, ``'all_true'``).
    4. Re-query each group twice with ``construct_query_MC``: once with the
       reference answer and once with the output of ``select_random_choice``.
       Every round is saved and passed to ``calculate_consistency_MC``.

    Args:
        args: Run configuration. Reads ``api_model``, ``model_type`` and
            ``tempeature``; ``local_image_path`` is overwritten.
        val_data: Iterable of records with at least ``id``, ``question``,
            ``question_type``, ``options``, ``answer``, ``img_type``,
            ``topic_difficulty`` and ``subfield``. Records are shallow-copied,
            so the caller's objects are not modified.
        model: Model handed to ``inference`` for non-API runs.
        template: Template handed to ``inference`` for non-API runs.

    Returns:
        None. Results are written to the paths produced by
        ``cacluate_current_time_save_path``.

    Raises:
        IndexError: If a record has more than ten options.
    """
    seed_everything(42)
    args.local_image_path = '/Uncertainty_MLLMs/MMMU/val/'

    samples = []
    for raw in val_data:
        if raw['question_type'] != 'multiple-choice':
            continue
        # Work on a copy: popping 'id' and rewriting 'options' on the
        # caller's records would break a second run over the same data.
        item = dict(raw)
        item['index'] = item.pop('id')
        item['options'] = extract_options(item['options'])
        item['choices'] = {
            _MMMU_OPTION_LABELS[position]: option
            for position, option in enumerate(item['options'])
        }
        samples.append(item)

    answer_all = _mmmu_run_round(args, model, template, samples, "All data", _mmmu_base_prompt)
    _mmmu_dump_json(answer_all, cacluate_current_time_save_path('all', args))
    calculate_consistency_MC(answer_all, 'All data-')

    answered_wrong = []
    answered_right = []
    for record in answer_all:
        response = record['response']
        if record['answer'] == response:
            answered_right.append(record)
        elif response == -2:
            # NOTE(review): -2 looks like the "no option extracted" marker of
            # extract_option; such records are left out of both groups.
            continue
        else:
            answered_wrong.append(record)

    _mmmu_dump_json(answered_wrong, cacluate_current_time_save_path('all_false', args))
    _mmmu_dump_json(answered_right, cacluate_current_time_save_path('all_true', args))

    # (count label, subset, progress description, prompt builder, save tag,
    #  prefix passed to calculate_consistency_MC). The prefixes are kept
    #  exactly as they were, including the missing trailing '-' on the last two.
    follow_up_rounds = (
        ("False Count", answered_wrong, "False->True", _mmmu_answer_prompt,
         'false_true', 'False->True-'),
        ("False Count", answered_wrong, "False->False", _mmmu_random_prompt,
         'false_false', 'False->False-'),
        ("True Count", answered_right, "True->False", _mmmu_random_prompt,
         'true_false', 'True->False'),
        ("True Count", answered_right, "True->True", _mmmu_answer_prompt,
         'true_true', 'True->True'),
    )
    for count_label, subset, desc, build_prompt, save_tag, log_prefix in follow_up_rounds:
        logging.info(f"{count_label}:{len(subset)}")
        round_records = _mmmu_run_round(args, model, template, subset, desc, build_prompt)
        _mmmu_dump_json(round_records, cacluate_current_time_save_path(save_tag, args))
        calculate_consistency_MC(round_records, log_prefix)
