# import os
# import json
# import torch
# from transformers import Glm4vForConditionalGeneration, AutoProcessor
# from tqdm import tqdm
# from PIL import Image

# # --- 1. 模型和处理器加载 ---
# model_id = "THUDM/GLM-4.1V-9B-Thinking"

# print(f"正在加载模型: {model_id}...")
# model = Glm4vForConditionalGeneration.from_pretrained(
#     model_id,
#     torch_dtype=torch.bfloat16,
#     low_cpu_mem_usage=True,
#     device_map="auto"
# )
# processor = AutoProcessor.from_pretrained(model_id, trust_remote_code=True)
# print("模型加载完成。")

# # --- 2. 路径和配置信息 ---
# base_data_dir = "."
# folders_to_process = ["Mongolia", "Vitnamese", "Singapore", "China"]
# output_dir = "Output_Json_GLM_VQA"
# os.makedirs(output_dir, exist_ok=True)

# # --- 3. 动态VQA提示词模板 (保持不变) ---
# VQA_PROMPT_TEMPLATES = {
#     "China": {
#         "Chinese": "请基于图像回答以下与中国文化相关的问题：\n{question}\n{options}\n这是一个多选题，请先返回所有可能的选项字母，再用中文解释你的选择。",
#         "English": "Based on the image, please answer the following question related to Chinese Culture.\n{question}\n{options}\nThis is a multiple-choice question. Please first return all possible option letters, then explain your choice in English."
#     },
#     "Indonesian": {
#         "Indonesian": "Berdasarkan gambar, silakan jawab pertanyaan berikut terkait Budaya Indonesia.\n{question}\n{options}\nIni adalah pertanyaan pilihan ganda. Harap kembalikan semua kemungkinan huruf opsi terlebih dahulu, lalu jelaskan pilihan Anda dalam Bahasa Indonesia.",
#         "English": "Based on the image, please answer the following question related to Indonesian Culture.\n{question}\n{options}\nThis is a multiple-choice question. Please first return all possible option letters, then explain your choice in English."
#     },
#     "Korea": {
#         "Korean": "이미지를 바탕으로 다음 한국 문화와 관련된 질문에 답변해 주세요.\n{question}\n{options}\n이것은 객관식 문제입니다. 먼저 가능한 모든 옵션 문자를 반환한 다음, 한국어로 당신의 선택을 설명해 주세요.",
#         "English": "Based on the image, please answer the following question related to Korean Culture.\n{question}\n{options}\nThis is a multiple-choice question. Please first return all possible option letters, then explain your choice in English."
#     },
#     "Mongolia": {
#         "Mongolian": "Зурагт үндэслэн Монголын соёлтой холбоотой дараах асуултад хариулна уу.\n{question}\n{options}\nЭнэ бол олон сонголттой асуулт юм. Эхлээд боломжит бүх сонголтын үсгийг буцааж, дараа нь сонголтоо монгол хэлээр тайлбарлана уу.",
#         "English": "Based on the image, please answer the following question related to Mongolian Culture.\n{question}\n{options}\nThis is a multiple-choice question. Please first return all possible option letters, then explain your choice in English."
#     },
#     "Singapore": {
#         "English": "Based on the image, please answer the following question related to Singaporean Culture.\n{question}\n{options}\nThis is a multiple-choice question. Please first return all possible option letters, then explain your choice in English.",
#         "Malay": "Berdasarkan imej, sila jawab soalan berikut yang berkaitan dengan Budaya Singapura.\n{question}\n{options}\nIni adalah soalan pilihan berganda. Sila kembalikan semua huruf pilihan yang mungkin terlebih dahulu, kemudian jelaskan pilihan anda dalam Bahasa Inggeris.",
#         "Chinese": "请基于图像回答以下与新加坡文化相关的问题。\n{question}\n{options}\n这是一个多选题，请先返回所有可能的选项字母，再用英文解释你的选择。",
#     },
#     "Vitnamese": {
#         "Vietnamese": "Dựa vào hình ảnh, vui lòng trả lời câu hỏi sau đây liên quan đến Văn hóa Việt Nam.\n{question}\n{options}\nĐây là một câu hỏi trắc nghiệm. Vui lòng trả về tất cả các chữ cái tùy chọn có thể có trước, sau đó giải thích lựa chọn của bạn bằng tiếng Việt.",
#         "English": "Based on the image, please answer the following question related to Vietnamese Culture.\n{question}\n{options}\nThis is a multiple-choice question. Please first return all possible option letters, then explain your choice in English."
#     }
# }
# NATIVE_LANGUAGE_MAP = {
#     "Indonesian": "Indonesian", "Korea": "Korean", "Mongolia": "Mongolian",
#     "Singapore": "Malay,Chinese", "Vitnamese": "Vietnamese", "China": "Chinese"
# }

# # --- 4. 遍历文件夹和文件进行处理 ---
# for folder_name in folders_to_process:
#     current_folder_path = os.path.join(base_data_dir, folder_name)
#     if not os.path.isdir(current_folder_path):
#         print(f"⚠️  警告: 文件夹 '{current_folder_path}' 不存在，已跳过。")
#         continue
#     print(f"\n📁 开始处理文件夹: {current_folder_path}")

#     for filename in os.listdir(current_folder_path):
#         if "Text_Only" not in filename and filename.endswith(".json"):
#             input_path = os.path.join(current_folder_path, filename)
#             print(f"  ➡️  正在处理VQA文件: {filename}")

#             try:
#                 with open(input_path, "r", encoding="utf-8") as f:
#                     data = json.load(f)
#             except Exception as e:
#                 print(f"    ❌ 读取文件失败: {input_path}, 错误: {e}")
#                 continue

#             # 确定语言和Prompt模板
#             if "English" in filename:
#                 language = "English"
#             else:
#                 language = NATIVE_LANGUAGE_MAP.get(folder_name, "English")
            
#             prompt_template = None
#             if len(language.split(",")) == 1:
#                 prompt_template = VQA_PROMPT_TEMPLATES[folder_name][language]
#             else:
#                 for l in language.split(","):
#                     if l in filename:
#                         prompt_template = VQA_PROMPT_TEMPLATES[folder_name][l]
#                         break
            
#             if not prompt_template:
#                 print(f"    ❌ 未能为文件 {filename} 找到匹配的Prompt模板，跳过。")
#                 continue

#             for item in tqdm(data, desc=f"  Processing items in {filename}", leave=False):
#                 answer_key = "glm_4_1v_answer"
#                 try:
#                     if "Image_path" not in item or not item["Image_path"]:
#                         item[answer_key] = "Error: Image_path is missing or empty."
#                         continue

#                     full_image_path = os.path.join(current_folder_path, item["Image_path"])
#                     if not os.path.exists(full_image_path):
#                         item[answer_key] = f"Error: Image file not found at {full_image_path}"
#                         continue
                    
#                     image = Image.open(full_image_path).convert("RGB")

#                     question = item.get("Question", "").strip()
#                     options = [f"A. {str(item.get('Option1', '')).strip()}", f"B. {str(item.get('Option2', '')).strip()}",
#                                f"C. {str(item.get('Option3', '')).strip()}", f"D. {str(item.get('Option4', '')).strip()}"]
#                     text_prompt = prompt_template.format(question=question, options="\n".join(options))

#                     # **关键更正**: 将PIL.Image对象直接嵌入到messages列表中
#                     messages = [
#                         {
#                             "role": "user",
#                             "content": [
#                                 {"type": "image", "image": image}, # 直接传入加载好的image对象
#                                 {"type": "text", "text": text_prompt}
#                             ],
#                         }
#                     ]

#                     # **关键更正**: apply_chat_template 现在直接处理内嵌的图像
#                     inputs = processor.apply_chat_template(
#                         messages,
#                         tokenize=True,
#                         add_generation_prompt=True,
#                         return_dict=True,
#                         return_tensors="pt"
#                     ).to(model.device)

#                     with torch.no_grad():
#                         generated_ids = model.generate(**inputs, max_new_tokens=2048, do_sample=False)
                    
#                     input_ids_len = inputs['input_ids'].shape[1]
#                     generated_ids_trimmed = generated_ids[0][input_ids_len:]
#                     output_text = processor.decode(
#                         generated_ids_trimmed, skip_special_tokens=True, clean_up_tokenization_spaces=False
#                     ).strip()

#                     item[answer_key] = output_text

#                 except Exception as e:
#                     item[answer_key] = f"Error: {str(e)}"

#             # 保存更新后的数据
#             base_filename = os.path.splitext(filename)[0]
#             output_filename = f"{base_filename}_glm4_1v_answered.json"
#             output_path = os.path.join(output_dir, output_filename)

#             with open(output_path, "w", encoding="utf-8") as f:
#                 json.dump(data, f, indent=2, ensure_ascii=False)

#             print(f"    ✅ VQA处理完成，结果已保存至: {output_path}")

# print(f"\n🎉 所有文件夹的VQA任务处理完毕！所有输出文件已保存到 '{output_dir}' 文件夹中。")

import os
import json
import torch
from transformers import Glm4vForConditionalGeneration, AutoProcessor
from tqdm import tqdm
from PIL import Image

# --- 1. 模型和处理器加载 (保持不变) ---
model_id = "THUDM/GLM-4.1V-9B-Thinking"

print(f"正在加载模型: {model_id}...")
model = Glm4vForConditionalGeneration.from_pretrained(
    model_id,
    torch_dtype=torch.bfloat16,
    device_map="auto"
)
processor = AutoProcessor.from_pretrained(model_id, trust_remote_code=True)
print("模型加载完成。")

# --- 2. 路径和配置信息 (保持不变) ---
base_data_dir = "."
folders_to_process = ["Japan", "China"]
output_dir = "Output_Json_GLM_VQA"
os.makedirs(output_dir, exist_ok=True)
answer_key = "glm_4_1v_answer" # 定义一个统一的key来存放答案

# --- 3. 动态VQA提示词模板 (保持不变) ---
VQA_PROMPT_TEMPLATES = {
    # ... (模板内容和原来一样，此处省略) ...
    "China": {
        "Chinese": "请基于图像回答以下与中国文化相关的问题：\n{question}\n{options}\n这是一个多选题，请先返回所有可能的选项字母，再用中文解释你的选择。",
        "English": "Based on the image, please answer the following question related to Chinese Culture.\n{question}\n{options}\nThis is a multiple-choice question. Please first return all possible option letters, then explain your choice in English."
    },
    "Indonesian": {
        "Indonesian": "Berdasarkan gambar, silakan jawab pertanyaan berikut terkait Budaya Indonesia.\n{question}\n{options}\nIni adalah pertanyaan pilihan ganda. Harap kembalikan semua kemungkinan huruf opsi terlebih dahulu, lalu jelaskan pilihan Anda dalam Bahasa Indonesia.",
        "English": "Based on the image, please answer the following question related to Indonesian Culture.\n{question}\n{options}\nThis is a multiple-choice question. Please first return all possible option letters, then explain your choice in English."
    },
    "Korea": {
        "Korean": "이미지를 바탕으로 다음 한국 문화와 관련된 질문에 답변해 주세요.\n{question}\n{options}\n이것은 객관식 문제입니다. 먼저 가능한 모든 옵션 문자를 반환한 다음, 한국어로 당신의 선택을 설명해 주세요.",
        "English": "Based on the image, please answer the following question related to Korean Culture.\n{question}\n{options}\nThis is a multiple-choice question. Please first return all possible option letters, then explain your choice in English."
    },
    "Mongolia": {
        "Mongolian": "Зурагт үндэслэн Монголын соёлтой холбоотой дараах асуултад хариулна уу.\n{question}\n{options}\nЭнэ бол олон сонголттой асуулт юм. Эхлээд боломжит бүх сонголтын үсгийг буцааж, дараа нь сонголтоо монгол хэлээр тайлбарлана уу.",
        "English": "Based on the image, please answer the following question related to Mongolian Culture.\n{question}\n{options}\nThis is a multiple-choice question. Please first return all possible option letters, then explain your choice in English."
    },
    "Singapore": {
        "English": "Based on the image, please answer the following question related to Singaporean Culture.\n{question}\n{options}\nThis is a multiple-choice question. Please first return all possible option letters, then explain your choice in English.",
        "Malay": "Berdasarkan imej, sila jawab soalan berikut yang berkaitan dengan Budaya Singapura.\n{question}\n{options}\nIni adalah soalan pilihan berganda. Sila kembalikan semua huruf pilihan yang mungkin terlebih dahulu, kemudian jelaskan pilihan anda dalam Bahasa Inggeris.",
        "Chinese": "请基于图像回答以下与新加坡文化相关的问题。\n{question}\n{options}\n这是一个多选题，请先返回所有可能的选项字母，再用英文解释你的选择。",
    },
    "Vitnamese": {
        "Vietnamese": "Dựa vào hình ảnh, vui lòng trả lời câu hỏi sau đây liên quan đến Văn hóa Việt Nam.\n{question}\n{options}\nĐây là một câu hỏi trắc nghiệm. Vui lòng trả về tất cả các chữ cái tùy chọn có thể có trước, sau đó giải thích lựa chọn của bạn bằng tiếng Việt.",
        "English": "Based on the image, please answer the following question related to Vietnamese Culture.\n{question}\n{options}\nThis is a multiple-choice question. Please first return all possible option letters, then explain your choice in English."
    },
    "Japan": {
        "Japanese": "日本文化に関する次の質問に答えてください。\n{question}\n{options}\nこれは多肢選択式の質問です。まずすべての可能な選択肢のアルファベットを返し、その後にあなたの選択を英語で説明してください。",
        "English": "Please answer the following question related to Japanese Culture.\n{question}\n{options}\nThis is a multiple-choice question. Please first return all possible option letters, then explain your choice in English."
    },
}
NATIVE_LANGUAGE_MAP = {
    "Indonesian": "Indonesian",
    "Korea": "Korean",
    "Mongolia": "Mongolian",
    "Singapore": "Malay,Chinese",
    "Vitnamese": "Vietnamese",
    "Japan": "Japanese"
}


# --- 4. 遍历文件夹和文件进行处理 (核心修改区域) ---
for folder_name in folders_to_process:
    current_folder_path = os.path.join(base_data_dir, folder_name)
    if not os.path.isdir(current_folder_path):
        print(f"⚠️  警告: 文件夹 '{current_folder_path}' 不存在，已跳过。")
        continue
    print(f"\n📁 开始处理文件夹: {current_folder_path}")

    for filename in os.listdir(current_folder_path):
        if "Text_Only" in filename or not filename.endswith(".json"):
            continue

        input_path = os.path.join(current_folder_path, filename)
        
        # --- 新增: 确定输出路径 ---
        base_filename = os.path.splitext(filename)[0]
        output_filename = f"{base_filename}_glm4_1v_answered.json"
        output_path = os.path.join(output_dir, output_filename)
        
        print(f"  ➡️  正在处理VQA文件: {filename}")
        print(f"      结果将保存至: {output_path}")

        try:
            with open(input_path, "r", encoding="utf-8") as f:
                input_data = json.load(f)
        except Exception as e:
            print(f"    ❌ 读取输入文件失败: {input_path}, 错误: {e}")
            continue
            
        # --- 新增: 断点续传逻辑 ---
        processed_items_lookup = set()
        if os.path.exists(output_path):
            try:
                with open(output_path, "r", encoding="utf-8") as f:
                    # 读取已有的结果
                    existing_data = json.load(f)
                # 创建一个已处理项的查找集合，使用 Image_path 作为唯一标识符
                for item in existing_data:
                    if item.get("Image_path") and answer_key in item:
                        processed_items_lookup.add(item["Image_path"])
                print(f"    🔍 发现已存在的输出文件，加载了 {len(processed_items_lookup)} 条已处理记录。")
                # 使用已有的数据作为起点
                results_data = existing_data
            except (json.JSONDecodeError, IOError) as e:
                print(f"    ⚠️ 读取现有输出文件失败: {output_path}, 将重新开始。错误: {e}")
                results_data = [] # 如果旧文件损坏，则从头开始
        else:
            results_data = [] # 如果没有输出文件，则从一个空列表开始
        
        # --- 修改: 准备语言和模板 (逻辑不变) ---
        if "English" in filename:
            language = "English"
        else:
            language = NATIVE_LANGUAGE_MAP.get(folder_name, "English")
        
        prompt_template = None
        if len(language.split(",")) == 1:
            prompt_template = VQA_PROMPT_TEMPLATES[folder_name][language]
        else:
            for l in language.split(","):
                if l in filename:
                    prompt_template = VQA_PROMPT_TEMPLATES[folder_name][l]
                    break
        
        if not prompt_template:
            print(f"    ❌ 未能为文件 {filename} 找到匹配的Prompt模板，跳过。")
            continue

        # --- 修改: 循环处理，增加跳过和即时保存逻辑 ---
        with tqdm(total=len(input_data), desc=f"  Processing {filename}", leave=False) as pbar:
            # 初始化进度条，让它能正确反映跳过和处理的项
            pbar.update(len(processed_items_lookup))

            for item in input_data:
                # 检查此项是否已经处理过
                if item.get("Image_path") in processed_items_lookup:
                    continue # 如果处理过，直接跳到下一个
                
                try:
                    # --- 以下是原始的推理逻辑 ---
                    if "Image_path" not in item or not item["Image_path"]:
                        item[answer_key] = "Error: Image_path is missing or empty."
                        continue

                    full_image_path = os.path.join(current_folder_path, item["Image_path"])
                    if not os.path.exists(full_image_path):
                        item[answer_key] = f"Error: Image file not found at {full_image_path}"
                        continue
                    
                    image = Image.open(full_image_path).convert("RGB")

                    question = item.get("Question", "").strip()
                    options = [f"A. {str(item.get('Option1', '')).strip()}", f"B. {str(item.get('Option2', '')).strip()}",
                               f"C. {str(item.get('Option3', '')).strip()}", f"D. {str(item.get('Option4', '')).strip()}"]
                    text_prompt = prompt_template.format(question=question, options="\n".join(options))

                    messages = [
                        {"role": "user", "content": [{"type": "image", "image": image}, {"type": "text", "text": text_prompt}]}
                    ]

                    inputs = processor.apply_chat_template(
                        messages, tokenize=True, add_generation_prompt=True, return_dict=True, return_tensors="pt"
                    ).to(model.device)

                    with torch.no_grad():
                        generated_ids = model.generate(**inputs, max_new_tokens=2048, do_sample=False)
                    
                    input_ids_len = inputs['input_ids'].shape[1]
                    generated_ids_trimmed = generated_ids[0][input_ids_len:]
                    output_text = processor.decode(
                        generated_ids_trimmed, skip_special_tokens=True, clean_up_tokenization_spaces=False
                    ).strip()

                    item[answer_key] = output_text

                except Exception as e:
                    item[answer_key] = f"Error: {str(e)}"
                
                finally:
                    # --- 核心改动: 无论成功或失败，都将处理过的 item 添加到结果中并立即保存 ---
                    results_data.append(item)
                    
                    # 写入文件
                    with open(output_path, "w", encoding="utf-8") as f:
                        json.dump(results_data, f, indent=2, ensure_ascii=False)
                    
                    # 更新进度条
                    pbar.update(1)


        print(f"    ✅ VQA处理完成: {filename}")

print(f"\n🎉 所有文件夹的VQA任务处理完毕！所有输出文件已保存到 '{output_dir}' 文件夹中。")
