from utils import LLMClient
import asyncio  
import time
import json
import os
import re
from tqdm import tqdm
import shutil
from llm_utils import clean_response, extract_triple_single_quote_json
import sys
import cv2
savejsonl = True
json_arr = []

test_model = 'llm'

def create_prompt(code, all_questions):
    return f"""You are given a python code that is used to generate a video to simulate the motion of objects.

Your task is to **evaluate each question** based on whether it is **correctly reflected in the python code**. If the answer of question 1 or question 2 is not true, then other questions should be answered as "False".


 **Input**:
- Questions: {all_questions}
- Code: {code}

---

 **For each question**, return:
- `"index"`: the question index
- `"question"`: the full question text
- `"analysis"`: your reasoning process and visual inference
- `"result"`: one of `"True"`, `"False"`, or `"Not sure"`
- `"confidence_score"`: an integer from 1 (very uncertain) to 5 (very certain)

---

**Output Format**:
Return a JSON list like this:
[
    {{
        "index": "1",
        "question": "The ball rolls along the circular path.",
        "analysis": "The object follows a closed curve consistent with a circular path from the top view.",
        "result": "True",
        "confidence_score": "5"
    }},
    ...
]
"""

async def main():
    valid_question_num = 0
    Model_name = "Qwen/Qwen2.5-72B-Instruct"
    index = 0
    client = LLMClient(model=Model_name, timeout_seconds=10000, temperature=0.0)
    for i in range(0, 443, 1):
        folder_id = 0
        json_path = f'finaldata1/val/all/video_{i}.json'
        code_folder = f'result/think/batch_0/video_{i}'
        if not os.path.exists(json_path) or not os.path.exists(code_folder):
            continue
        try:
        # if True:
            with open(json_path, "r", encoding="utf-8") as f:
                item = json.load(f)
            origin_question = item['question']
            
            try:
                after_verify = item['vlm_questions']
            except:
                print(type(item['vlm_questions']))
                print(f'after_verify error: {json_path}')
                break
            if after_verify['enableAnnotator'] == 'No' or len(after_verify['vlm_questions']) == 0:
                continue
            valid_question_num += 1
            all_questions = '1. Is the code can be executed? 2. Is the code can generate video?'
            all_weight= []
            try:
                for vlmindex in range(len(after_verify['vlm_questions'])):
                    subquestion = after_verify['vlm_questions'][vlmindex]['question']
                    all_questions += f'{vlmindex+3}. {subquestion}'
            except:
                print(json_path)

            
            for video_name in os.listdir(code_folder):
                with open(f"{code_folder}/{video_name}", "r", encoding="utf-8") as f:
                    msg = f.read()
                jdata = json.loads(msg)
                code = jdata['think']
                code = clean_response(code)
                code = extract_triple_single_quote_code(code)
                
                messages = [
                    {
                        "role": "user",
                        "content": 
                            [{
                                "type": "text", 
                                "text": create_prompt(code[0], all_questions)
                            }]
                    }]
                    #                             
                if savejsonl:
                    json_arr.append({
                        "messages": messages,
                        "id": i,
                        "document": json_path,
                        "video": f"{code_folder}/{video_name}"
                    })
                else:
                    responses = await client.process_all_inputs([messages], model=Model_name)
                    try:
                        final_json = extract_triple_single_quote_json(responses[0][0])
                        if final_json:
                            print(final_json)
                    except:
                        print(video_name, responses)
        except Exception as e:
            print(f'error: {json_path}, {e}')
    if savejsonl:
        with open(f"valresult/val_llm.jsonl", "w", encoding="utf-8") as f:
            for item in json_arr:
                f.write(json.dumps(item, ensure_ascii=False) + "\n")
    print(f'valid_question_num: {valid_question_num}')

    return
def transfer_signal(text):
    if '\n' in text:
        text = text[3:-3]
    text = text.replace("\"", "\\\"")
    return text
def process_jsonl():
    total_num = 0
    process_num = 0
    null_num = 0
    batch_index = 0
    with open(f"valresult/run_val_{test_model}_responses.jsonl", "r", encoding="utf-8") as f:
        for i, row in tqdm(enumerate(f)):
            item = json.loads(row)
            total_num += 1
            folder_id = int(item['id']) // 2500
            id = item['id']
            document = item['document']
            video = item['video']
            with open(document, "r", encoding="utf-8") as f:
                setting = json.load(f)
            origin_question = setting['question']
            level = setting['Level']
            vlm_questions = setting['vlm_questions']['vlm_questions']
            
            weight_arr = []
            for vlmindex in range(len(vlm_questions)):
                weight_arr.append(vlm_questions[vlmindex]['weight'])

            for index, response in enumerate(item['responses']):             
                if response is None:
                    null_num += 1
                    continue
                save_name = f"{os.path.basename(video).replace('.json', '')}_{batch_index}.json"
                try:
                    result = clean_response(response)
                except:
                    print('first:', response)
                    raise Exception(f'{json_folder}/{save_name}')
                    break
                try:
                    json.loads(result)
                except:
                    filter_result = extract_triple_single_quote_json(result)
                    if len(filter_result) > 0:
                        result = filter_result
                    else:
                        if type(result) != list:
                            result = [result]
                
                try:  
                    result[0] = result[0].replace('\\(', '\\\\(').replace('\\)', '\\\\)')
                    result[0] = result[0].replace('"\n', '",\n')
                    result[0] = re.sub(r',\n\s*}', r'\n}', result[0])
                    result[0] = re.sub(r':(\s)\n', r':\1', result[0])
                    result = json.loads(result[0])
                except:
                    try:
                        matches = re.findall(r': ".*"}?,\s*\n', result[0])
                        confidence_matches = re.findall(r'"confidence_score":\s*"?(\d+)"?,?\n', result[0])
                        new_result = []
                        for jindex in range(0, len(matches), 4):
                            new_result.append({
                                "index": transfer_signal(matches[jindex]),
                                "question": transfer_signal(matches[jindex+1]),
                                "analysis": transfer_signal(matches[jindex+2]),
                                "result": transfer_signal(matches[jindex+3]),
                                "confidence_score": confidence_matches[jindex//4]
                            })
                        result = new_result
                    except:
                        print(f'second error:{json_folder}/{save_name}')
                json_folder = f'result/valresult/{test_model}/batch_0/video_{id}'
                os.makedirs(json_folder, exist_ok=True)
                save_json = {
                    "document": document,
                    "video": video,
                    "weight": weight_arr, 
                    "vlm_result": result,
                }
                with open(f'{json_folder}/{save_name}', 'w', encoding='utf-8') as f:
                    json.dump(save_json, f, indent = 4, ensure_ascii=False)
                process_num += 1
        print(f'process_num: {process_num}, total_num: {total_num}, null_num: {null_num}, error_num: {total_num - process_num - null_num}')

            

if __name__ == "__main__":
    if sys.argv[1] == 'main':
        print('get run.jsonl')
        asyncio.run(main())
    elif sys.argv[1] == 'process_jsonl':
        print('process_jsonl')
         process_jsonl()