import os
import json
import re
import ast
import base64
from openai import OpenAI

import sys
sys.path.append("/mnt/workspace/workgroup/zheliu.lzy/vision_cot/OminiControl")
from src.utils.prompt import gen_prompt, edit_prompt, identity_prompt

# openai_api_key = "sk-ad724c4ff96b4b02abdebfc854573d34"
openai_api_key = "sk-DH91dUEwKErjycXl516fAbAf693946D183B1070193E84806"
openai_api_key = "sk-9Elt3DNwnJzb7NL871481c256f5d4bEb80805aD72e5f508f"
# openai_api_key = "sk-pa2hox2dxHEPQ5ZxAfDcFc66C6B247Cd957aA045C9D69a1d"
openai_api_base = "https://api.bltcy.ai/v1"
model="gemini-2.5-pro-exp-03-25"
# gemini-2.5-pro-preview-03-25

# openai_api_key = "EMPTY"
# openai_api_base = "https://mlflow-debug-fg35th-006877-8000.cloud-ide.alibaba-inc.com/v1" # lzy
# openai_api_base = "https://mlflow-debug-qmccf1-010612-8080.cloud-ide.alibaba-inc.com/v1" # zqh
# model="Qwen/Qwen2.5-VL-72B-Instruct-AWQ",

def vlm_request(messages, model="gemini-2.5-pro-exp-03-25", max_retries=3, retry_delay=1, optim=False):
    # if optim:
    #     openai_api_key="5K5LQuiwumyirmh58Q4v6grxlep8ngeU"
    #     openai_api_base="https://api.deepinfra.com/v1/openai"
    #     model="google/gemini-2.5-pro"
    # else:
    #     openai_api_key="sk-9Elt3DNwnJzb7NL871481c256f5d4bEb80805aD72e5f508f"
    #     openai_api_base="https://api.bltcy.ai/v1"

    # openai_api_key="5K5LQuiwumyirmh58Q4v6grxlep8ngeU"
    openai_api_key="kKgaklj9R5HY5gmDFj3GK27UxUuZqX5P"
    openai_api_base="https://api.deepinfra.com/v1/openai"
    model="google/gemini-2.5-pro"
        
    client = OpenAI(
        api_key=openai_api_key,
        base_url=openai_api_base,
    )
    
    for attempt in range(max_retries):
        try:
            completion = client.chat.completions.create(
                model=model,
                messages=messages,
                # enable_thinking=False,
            )
            
            # 解析并验证响应结构
            response_json = json.loads(completion.model_dump_json())
            if 'choices' not in response_json or len(response_json['choices']) == 0:
                raise ValueError("Invalid API response: missing choices field")
            
            first_choice = response_json['choices'][0]
            if 'message' not in first_choice or 'content' not in first_choice['message']:
                raise ValueError("Invalid message structure in API response")
            content = first_choice['message']['content']
            return content
            
        except Exception as e:
            print(f"Attempt {attempt + 1} failed: {str(e)}")
            if attempt > max_retries - 1:
                print("All retry attempts exhausted.")
                raise  # 抛出最后捕获的异常

    return None  # 理论上不会执行到此处，因循环内已处理所有重试

def vlm_request_ori(messages, model="gemini-2.5-pro-exp-03-25", max_retries=3, retry_delay=1):
    openai_api_key="sk-9Elt3DNwnJzb7NL871481c256f5d4bEb80805aD72e5f508f"
    openai_api_base="https://api.bltcy.ai/v1"
        
    client = OpenAI(
        api_key=openai_api_key,
        base_url=openai_api_base,
    )
    
    for attempt in range(max_retries):
        try:
            completion = client.chat.completions.create(
                model=model,
                messages=messages,
                # enable_thinking=False,
            )
            
            # 解析并验证响应结构
            response_json = json.loads(completion.model_dump_json())
            if 'choices' not in response_json or len(response_json['choices']) == 0:
                raise ValueError("Invalid API response: missing choices field")
            
            first_choice = response_json['choices'][0]
            if 'message' not in first_choice or 'content' not in first_choice['message']:
                raise ValueError("Invalid message structure in API response")
            content = first_choice['message']['content']
            return content
            
        except Exception as e:
            print(f"Attempt {attempt + 1} failed: {str(e)}")
            if attempt > max_retries - 1:
                print("All retry attempts exhausted.")
                raise  # 抛出最后捕获的异常

    return None  # 理论上不会执行到此处，因循环内已处理所有重试

def extract_and_parse_json(text_string):
    """
    从包含 JSON 的字符串中提取并解析 JSON 数据。
    优先尝试提取被 '```json ... ```' 包裹的内容。
    如果找不到代码块，则尝试直接解析整个字符串（去除首尾空格后）。

    Args:
        text_string (str): 包含 JSON 数据的输入字符串。

    Returns:
        dict or list or None: 解析后的 Python 对象 (字典或列表)，
                             如果找不到有效的 JSON 或解析失败，则返回 None。
    """
    if not isinstance(text_string, str):
        print("输入不是一个字符串。")
        return None

    # 1. 尝试使用正则表达式查找 ```json ... ``` 代码块
    # re.DOTALL 让 '.' 匹配包括换行符在内的任何字符
    match = re.search(r'```json\s*(.*?)\s*```', text_string, re.DOTALL)

    json_str_to_parse = None

    if match:
        # 如果找到匹配项，提取第一个捕获组的内容
        json_str_to_parse = match.group(1).strip()
        # print("在 ```json 代码块中找到 JSON。")
    else:
        # 2. 如果未找到代码块，尝试将整个字符串视为 JSON（去除首尾空格）
        # 检查字符串是否至少看起来像一个 JSON 对象或数组
        stripped_string = text_string.strip()
        if (stripped_string.startswith('{') and stripped_string.endswith('}')) or \
           (stripped_string.startswith('[') and stripped_string.endswith(']')):
             json_str_to_parse = stripped_string
             # print("未找到 ```json 代码块，尝试直接解析。")
        else:
            # print("未找到代码块，字符串看起来也不像 JSON。")
            pass # 保持 json_str_to_parse 为 None

    # 3. 如果提取到了可能的 JSON 字符串，则尝试解析
    if json_str_to_parse:
        try:
            parsed_json = json.loads(json_str_to_parse)
            # print("JSON 解析成功。")
            return parsed_json
        except json.JSONDecodeError as e:
            print(f"JSON 解析失败: {e}")
            # 如果从代码块提取的内容解析失败，可以尝试备用方案（整个字符串）
            if match: # 仅当第一次尝试是从代码块提取时，才进行此回退
                 stripped_string = text_string.strip()
                 if (stripped_string.startswith('{') and stripped_string.endswith('}')) or \
                    (stripped_string.startswith('[') and stripped_string.endswith(']')):
                     print("代码块内容解析失败，尝试回退解析整个字符串...")
                     try:
                         parsed_json = json.loads(stripped_string)
                         print("回退解析成功。")
                         return parsed_json
                     except json.JSONDecodeError as e_fallback:
                         print(f"回退解析也失败了: {e_fallback}")
                         return None
            return None # 如果不是从代码块提取的，或者回退也失败了

    # 如果没有提取到任何内容，或者解析失败
    # print("未能提取或解析有效的 JSON。")
    return None

def extract_and_parse_list(text_string):
    """
    从包含 ```python ... ``` 代码块的字符串中提取 Python 列表。

    Args:
        text_string (str): 包含列表表示的输入字符串。

    Returns:
        list or None: 如果成功提取并解析为列表，则返回该列表，否则返回 None。
    """
    if not isinstance(text_string, str):
        print("错误：输入必须是字符串。")
        return None

    # 使用正则表达式查找 ```python ... ``` 块内的内容
    # re.DOTALL 标志让 '.' 可以匹配换行符
    match = re.search(r'```python\s*(.*?)\s*```', text_string, re.DOTALL)

    if match:
        list_string = match.group(1).strip() # 提取捕获组内容并去除首尾空格
        # print(f"提取到的字符串: '{list_string}'") # 调试信息
        try:
            # 使用 ast.literal_eval 安全地将字符串解析为 Python 对象
            # 它只能处理 Python 的字面量（字符串、数字、元组、列表、字典、布尔值、None）
            # 这可以防止执行恶意代码
            parsed_object = ast.literal_eval(list_string)

            # 确保解析结果确实是一个列表
            if isinstance(parsed_object, list):
                # print("解析成功，结果是列表。") # 调试信息
                return parsed_object
            else:
                print(f"错误：解析成功，但结果不是列表 (类型为: {type(parsed_object)})。")
                return None
        except (ValueError, SyntaxError, TypeError) as e:
            # 如果字符串不是有效的 Python 字面量，会抛出错误
            print(f"错误：解析字符串时出错 - {e}")
            return None
    else:
        # print("错误：未在字符串中找到 ```python ... ``` 代码块。") # 调试信息
        return None

if __name__ == "__main__":
    # image_path = "test/boat/flux.png"
    # with open(image_path, "rb") as f:
    #     base64_image = base64.b64encode(f.read()).decode('utf-8')
    
    # messages=[
    #     {
    #         "role": "user","content": [
    #             {"type": "text","text": "这是什么"},
    #             {"type": "image_url", "image_url": {"url": f"data:image/jpeg;base64,{base64_image}"}}
    #         ]
    #     }
    # ]
    global_prompt = "A green twintail girl in orange dress is sitting on the sofa while a messy desk under a big window on the left, a lively aquarium is on the top right of the sofa, realistic style"
    messages=[
        {
            "role": "user",
            "content": [
                # {"type": "text", "text": f"{generate_prompt}\nCaption: {global_prompt}"},
                # {"type": "text", "text": f"{gen_prompt}"},
                {"type": "text", "text": f"{identity_prompt.replace('<caption>', global_prompt)}"},
            ]
        }
    ]
    content = vlm_request(messages)
    answer = content.split('</think>')[-1]
    ans_json = extract_and_parse_json(answer)
    ans_list = extract_and_parse_list(answer)
    print(1)