from openai import OpenAI
import os
import json
import re
import base64
import httpx

os.environ["http_proxy"] = "http://localhost:7897"
os.environ["https_proxy"] = "http://localhost:7897"
# Use API key from environment variables (recommended method)
client = OpenAI(base_url='',
                http_client=httpx.Client(verify=False, timeout=60.0),
                api_key='') 

def image_to_base64(image_path):
    """Convert image to base64 string (required for GPT-4o)"""
    with open(image_path, "rb") as image_file:
        return base64.b64encode(image_file.read()).decode("utf-8")

def single_image_inference_gpt4o(image_path, input_text):
    # Load image and convert to base64
    base64_image = image_to_base64(image_path)

    response = client.chat.completions.create(
        model="gpt-4o",
        messages=[
            {
                "role": "user",
                "content": [
                    {"type": "text", "text": input_text},
                    {
                        "type": "image_url",
                        "image_url": {
                            "url": f"data:image/jpeg;base64,{base64_image}"
                        }
                    }
                ]
            }
        ],
        temperature=0.2,
        max_tokens=1024
    )

    return response.choices[0].message.content

def extract_step_conclusions(item):
    """Extract conclusions from all key_steps"""
    conclusions = []
    i = 1
    while True:
        step_key = f"key_step_{i}"  
        if step_key not in item:     
            break
        step_data = item[step_key]
        if "conclusion" in step_data:
            conclusions.append(step_data["conclusion"])
        i += 1
    return conclusions

def clean_model_response(response):

    # 1. Remove leading/trailing whitespace and BOM marker
    response = response.strip().replace('\ufeff', '')

    # 2. Remove non-JSON characters at the beginning (until the first [ or {)
    response = re.sub(r'^[^{[]*', '', response)

    # 3. Remove non-JSON characters at the end (after the last ] or })
    response = re.sub(r'[^}\]]*$', '', response)

    # 4. Special handling for common code markers (like ```json and ```)
    response = response.replace('```json', '').replace('```', '')

    # 5. Remove leading/trailing whitespace again
    return response.strip()

def process_experiment_folders(data_dir, output_dir, md_name, max_folders=1):
    """
    Process experiment folders (up to the specified number)
    
    Args:
        data_dir: Root directory of experiment folders
        model_path: Model path
        output_dir: Output directory
        md_name: Model name (used to find .md files)
        max_folders: Maximum number to process (default 10)
    """
    os.makedirs(output_dir, exist_ok=True)
    processed_count = 0

    for folder_name in os.listdir(data_dir):
        if processed_count >= max_folders:
            break
            
        folder_path = os.path.join(data_dir, folder_name)
        if not os.path.isdir(folder_path):
            continue

        output_subdir = os.path.join(output_dir, folder_name)
        os.makedirs(output_subdir, exist_ok=True)  # Add this line

        # Find JSON and image files
        json_file = next((f for f in os.listdir(folder_path) if f.endswith('.json')), None)
        # internvl_2.5_78B internvl_2.5MPO_78B internvl_3_78B internvl_3-instruct_78B llama3.2V-cot_11B llava_ov_72B qvq_72B qwen_2.5_vl_7B qwen_2.5_vl_72B
        # InternVL2_5-78B  InternVL2_5-78B-MPO InternVL3-78B-Instruct InternVL3-78B llama3.2V-cot-11B QVQ-72B qwen2_5vl-7b qwen2_5vl-72b
        md_file = next((f for f in os.listdir(folder_path) if f.lower().endswith(f'{md_name.lower()}.md')), None)
        raw_image = next((f for f in os.listdir(folder_path) if f.endswith('_raw.jpg') or f.endswith('_raw.png')), None)
        
        if not (json_file and raw_image and md_file):
            print(f"Skipping {folder_name}: Missing JSON, image, or MD file")
            processed_count += 1
            continue

        try:
            json_path = os.path.join(folder_path, json_file)
            md_path = os.path.join(folder_path, md_file)
            image_path = os.path.join(folder_path, raw_image)

            # Check if output file already exists and is not empty
            output_file = os.path.join(
                output_dir, 
                folder_name,
                f"{folder_name}_reflection.json"
            )
            
            if os.path.exists(output_file) and os.path.getsize(output_file) > 0:
                print(f"Skipping {folder_name}: Output file already exists and is not empty")
                processed_count += 1
                continue

            with open(json_path, 'r', encoding='utf-8') as f_json:
                json_content = json.load(f_json)
                with open(md_path, 'r', encoding='utf-8') as f_md:
                    md_content = f_md.read().strip()

                    # Handle array case
                    if isinstance(json_content, list):
                        for item in json_content:
                            if not (isinstance(item, dict) and 'query' in item):
                                continue
                    
                        conclusions = extract_step_conclusions(item)
                        # Use regex to match both English commas `,` and Chinese commas `，`
                        sentences = re.split(r'[,，.]', item['original_scene']['description'])  # Match both English and Chinese commas
                        sentences = [s.strip() for s in sentences if s.strip()]  # Remove whitespace and filter empty strings
                        # Build input text
                        input_text = (
                                "# Task\n"
                                "Evaluate reflection steps in image-based problem solutions, where reflections are self-corrections or reconsiderations of previous statements.\n"
                                "\n"
                                "# Reflection Step Identification \n"
                                "Reflections typically begin with phrases like:\n"
                                "- \"But xxx\"\n"
                                "- \"Alternatively, xxx\" \n"
                                "- \"Maybe I should\"\n"
                                "- \"Let me double-check\"\n"
                                "- \"Wait xxx\"\n"
                                "- \"Perhaps xxx\"\n"
                                "It will throw an doubt of its previously reached conclusion or raise a new thought.\n"
                                "\n"
                                "# Evaluation Criteria\n"
                                "Correct reflections must:\n"
                                "1. Reach accurate conclusions aligned with ground truth\n"
                                "2. Use new insights to find the mistake of the previous conclusion or verify its correctness. \n"
                                "\n"
                                "Invalid reflections include:\n"
                                "1. Repetition - Restating previous content or method without new insights\n"
                                "2. Wrong Conclusion - Reaching incorrect conclusions vs ground truth\n"
                                "3. Incompleteness - Proposing but not executing new analysis methods\n"
                                "4. Other - Additional error types\n"
                                "\n"
                                "# Output Requirements\n"
                                "1. The output format must be in valid JSON format without any other content.\n"
                                "2. Output maximum 30 reflection steps.\n"
                                "\n"
                                "Here is the json output format:\n"
                                "## Output Format\n"
                                "```json\n"
                                "[\n"
                                "  {{\n"
                                "    \"conclusion\": \"One-sentence summary of reflection outcome\",\n"
                                "    \"judgment\": \"Correct|Wrong\",\n"
                                "    \"error_type\": \"N/A|Repetition|Wrong Conclusion|Incompleteness|Other\"\n"
                                "  }}\n"
                                "]\n"
                                "```\n"
                                "\n"
                                "# Rules\n"
                                "1. Preserve original content and order\n"
                                "2. No new interpretations\n"
                                "3. Include ALL reflection steps\n"
                                "4. Empty list if no reflections found\n"
                                "5. Direct JSON output without any other output\n"
                                "\n"
                                "# Input Format\n"
                                "\n"
                                "[Problem]\n"
                                "\n"
                                f"{{{item['query']} }}\n"
                                "\n"
                                "[Solution]\n"
                                "\n"
                                f"{{{md_content} }}\n"
                                "[Ground Truth Information]\n"
                                "\n"
                                "{\n"
                        )

                        idx = 1
                        for i, sentence in enumerate(sentences, 1):
                            input_text += f"{i}. {sentence}\n"
                            idx += 1
                        for i, conclusion in enumerate(conclusions, 1):
                            input_text += f"{idx}. {conclusion}\n"
                            idx += 1
                        input_text+=(
                                "}\n"
                        )
                    
                        response = single_image_inference_gpt4o(image_path, input_text)
                        response=clean_model_response(response)

                        # Save results
                        with open(output_file, 'w', encoding='utf-8') as f_out:
                             f_out.write(response)
                        
                        print("Processed " + str(processed_count+1) + " data items")

                        processed_count += 1
                        
                        if processed_count >= max_folders:
                            break
                    else:
                        print(f"{json_path} is not a valid array format")
        except Exception as e:
            print(f"Error processing {folder_name}: {str(e)}")

if __name__ == "__main__":

    data_directory = r"D:\VSCode_Project\Project-MLLM\Mini-data\post-training\single\DynamicPrediction"

    # internvl2.5 internvl2.5MPO internvl3 internvl3-instruct llava-cot llavaov qvq qwen7b qwen72b
    output_directory = r"D:\VSCode_Project\Project-MLLM\Result\output_single_img\DynamicPrediction\r1_vl_2B"

    # internvl_2.5_78B internvl_2.5MPO_78B internvl_3_78B internvl_3-instruct_78B llama3.2V-cot_11B llava_ov_72B qvq_72B qwen_2.5_vl_7B qwen_2.5_vl_72B
    # InternVL2_5-78B  InternVL2_5-78B-MPO InternVL3-78B-Instruct InternVL3-78B llama3.2V-cot-11B QVQ-72B qwen2_5vl-7b qwen2_5vl-72b
    # eureka-7b, qwen_2_vl_2B, r1_vl_2B
    # MM-Eureka,qwen2-vl-2b, r1-vl-2b
    md_name = "r1_vl_2B"

    print("start!")
    
    # Execute processing (default max 1)
    process_experiment_folders(
        data_dir=data_directory,
        output_dir=output_directory,
        md_name = md_name,
        max_folders=100
    )
    print("Done!")




