import json
import logging
import re
import asyncio
import copy
from llms.llms import async_call_llm
from utils.wordCounter import count_words
from json_repair import repair_json

class GenerationAgent:

    @staticmethod
    async def async_generate(model, example, semaphore):
        # 深拷贝输入数据，避免修改原始数据
        example = copy.deepcopy(example)
        
        # 先标准化数据结构，确保格式正确
        if 'weekly_plan' in example:
            if not isinstance(example['weekly_plan'], list):
                if isinstance(example['weekly_plan'], str):
                    example['weekly_plan'] = [{"week_id": "Week 1", "events": example['weekly_plan']}]
                elif isinstance(example['weekly_plan'], dict):
                    example['weekly_plan'] = [example['weekly_plan']]
                else:
                    example['weekly_plan'] = []
        
        if example['type'] == 'Week':
            example = await GenerationAgent.async_generate_week(model, example, semaphore)
        elif example["type"] == "Floor":
            example = await GenerationAgent.async_generate_floor(model, example, semaphore)
        elif example["type"] == "Menu Week":
            example = await GenerationAgent.async_generate_menu(model, example, semaphore)
        elif example["type"] == "Block":
            example = await GenerationAgent.async_generate_block(model, example, semaphore)
        return example

    @staticmethod
    async def async_generate_week(model, example, semaphore):
        # 确保 weekly_plan 是列表
        if 'weekly_plan' not in example or not example['weekly_plan']:
            example['weekly_plan'] = []
        elif not isinstance(example['weekly_plan'], list):
            if isinstance(example['weekly_plan'], str):
                example['weekly_plan'] = [{"week_id": "Week 1", "events": example['weekly_plan']}]
            elif isinstance(example['weekly_plan'], dict):
                example['weekly_plan'] = [example['weekly_plan']]
            else:
                example['weekly_plan'] = []

        # 创建一个新列表来保存处理后的周计划
        processed_weeks = []
        
        # 确保每个元素都包含必要字段
        for i, week in enumerate(example['weekly_plan']):
            # 如果元素不是字典，创建一个新字典
            if not isinstance(week, dict):
                processed_week = {"week_id": f"Week {i+1}", "events": str(week)}
            else:
                # 创建原始字典的深拷贝
                processed_week = copy.deepcopy(week)
                
                # 添加必要字段
                if 'week_id' not in processed_week:
                    processed_week['week_id'] = f"Week {i+1}"
                if 'events' not in processed_week:
                    processed_week['events'] = ""
            
            processed_weeks.append(processed_week)
        
        # 用处理后的列表替换原始列表
        example['weekly_plan'] = processed_weeks

        async def process_week(week):
            # 不再需要检查week是否为字典，因为之前已经确保了所有元素都是字典
            week_id = week.get('week_id', "Unknown Week")
            events = week.get('events', "")
            
            # 确保events是字符串
            if not isinstance(events, str):
                if isinstance(events, list):
                    events = ", ".join([str(event) for event in events])
                else:
                    events = str(events)
            
            prompt = f"""You are an expert writer. 
Write a 200-word weekly diary entry for the week of {week_id}.
The events for this week are: {events}
You should consider the coherence of the diary entry referring to the plan of the whole year:
{example['weekly_plan']}
You should consider the user requirements: {example['prompt']}
Check from the user requirements if there are any special events that should be included in the diary entry. If there are, include them in the diary entry. If there are no special events, write a general diary entry for the week.
Return the diary entry in the following json format:
{{
    "week_id": "{week_id}",
    "check": "reason and check if the user requirements are met",
    "diary_entry": "Your 200-word diary entry here" 
}}
"""
            logging.info(f"Generating initial diary entry for week {week_id}")

            # 最多尝试3次获取有效响应
            max_attempts = 3
            for attempt in range(max_attempts):
                async with semaphore:
                    response = await async_call_llm(model, prompt)
                
                # repair the json string
                try:
                    response = repair_json(response)
                    
                    # 寻找JSON对象
                    match = re.search(r"\{.*\}", response, re.DOTALL)
                    if match:
                        response_json = match.group(0)
                        
                        try:
                            diary_entry = json.loads(response_json)
                            
                            # 检查必要的键是否存在
                            if 'diary_entry' in diary_entry:
                                week['diary_entry'] = diary_entry['diary_entry']
                                # 确保diary_entry是字符串
                                if not isinstance(week['diary_entry'], str):
                                    week['diary_entry'] = str(week['diary_entry'])
                                week['length_requirement'] = 200
                                logging.info(f"Diary entry word count: {count_words(week['diary_entry'])}")
                                break
                            else:
                                # 尝试从其他可能的键中获取内容
                                for possible_key in ['entry', 'content', 'text', 'diary']:
                                    if possible_key in diary_entry:
                                        week['diary_entry'] = diary_entry[possible_key]
                                        if not isinstance(week['diary_entry'], str):
                                            week['diary_entry'] = str(week['diary_entry'])
                                        week['length_requirement'] = 200
                                        logging.info(f"Used alternative key '{possible_key}' for diary entry")
                                        break
                                
                                # 如果仍然没有找到合适的键，使用整个响应文本
                                if 'diary_entry' not in week and attempt == max_attempts - 1:
                                    # 去除JSON格式，保留文本内容
                                    text_content = re.sub(r'[{}"\'week_id[^:]*:|check[^:]*:|\s*]', '', response_json)
                                    week['diary_entry'] = text_content.strip() or f"Weekly diary for {week_id}."
                                    week['length_requirement'] = 200
                                    logging.warning(f"Created fallback diary entry from JSON text for {week_id}")
                        except json.JSONDecodeError:
                            if attempt == max_attempts - 1:  # 最后一次尝试
                                week['diary_entry'] = f"Weekly diary for {week_id}."
                                week['length_requirement'] = 200
                                logging.warning(f"JSON decode error, created fallback diary entry for {week_id}")
                    else:
                        # 如果没有找到JSON，使用整个响应文本
                        if attempt == max_attempts - 1:  # 最后一次尝试
                            week['diary_entry'] = response.strip() or f"Weekly diary for {week_id}."
                            week['length_requirement'] = 200
                            logging.warning(f"No JSON found, using full response as diary entry for {week_id}")
                except Exception as e:
                    logging.error(f"Error processing response for {week_id}: {e}")
                    if attempt == max_attempts - 1:  # 最后一次尝试
                        week['diary_entry'] = f"Weekly diary for {week_id}."
                        week['length_requirement'] = 200
                        logging.warning(f"Exception occurred, created fallback diary entry for {week_id}")

            # 确保diary_entry字段存在
            if 'diary_entry' not in week:
                week['diary_entry'] = f"Weekly diary for {week_id}."
                week['length_requirement'] = 200
                logging.warning(f"Created fallback diary entry for {week_id}")

            # Refine the diary entry
            try:
                current_length = count_words(week['diary_entry'])
                required_length = week['length_requirement']

                word_diff = abs(required_length - current_length)

                while word_diff > (required_length * 0.1):
                    refinement_prompt = f"""You are an expert editor. The provided text need to be {"shorten" if current_length > required_length else "lengthen"} by {word_diff} words while maintaining the original meaning and coherence.
                    Text:
                    {week['diary_entry']}
                    Return only the refined text."""

                    logging.info(f"Refining text for week {week_id}")
                    async with semaphore:
                        refined_text = await async_call_llm(model, refinement_prompt)
                    
                    if refined_text and len(refined_text) > 10:
                        week['diary_entry'] = refined_text.strip()
                        logging.info(f"Refined text: {week['diary_entry'][:50]}...")
                    else:
                        break  # 如果获取到的文本太短，不再尝试优化
                    
                    current_length = count_words(week['diary_entry'])
                    word_diff = abs(required_length - current_length)
                    
                    if word_diff <= (required_length * 0.1):
                        break
            except Exception as e:
                logging.error(f"Error during refinement for {week_id}: {e}")
            
            logging.info(f"Final diary entry word count: {count_words(week['diary_entry'])}")
            return week

        # Process all weeks concurrently
        tasks = [process_week(week) for week in example['weekly_plan']]
        
        try:
            processed_results = await asyncio.gather(*tasks)
            example['weekly_plan'] = processed_results
        except Exception as e:
            logging.error(f"Error during concurrent processing: {e}")
            # 确保至少有一些结果
            processed_results = []
            for week in example['weekly_plan']:
                try:
                    if 'diary_entry' not in week:
                        week['diary_entry'] = f"Weekly diary for {week.get('week_id', 'Unknown Week')}."
                        week['length_requirement'] = 200
                    processed_results.append(week)
                except Exception as inner_e:
                    logging.error(f"Error processing individual week: {inner_e}")
                    # 添加一个默认的周计划以保持结构完整
                    processed_results.append({
                        "week_id": "Unknown Week",
                        "diary_entry": "Weekly diary entry placeholder.",
                        "length_requirement": 200
                    })
        
        example['final_text'] = GenerationAgent.get_final_week_text(example['weekly_plan'])
        return example

    @staticmethod
    def get_final_week_text(weekly_plan):
        """
        Get the final text from the generated text with respect to the plan.
        """
        text = ""

        for week in weekly_plan:
            if isinstance(week, dict):
                week_id = str(week.get('week_id', "Unknown Week"))
                # 确保diary_entry是字符串
                diary_entry = week.get('diary_entry', "")
                if not isinstance(diary_entry, str):
                    diary_entry = str(diary_entry)
                text += '#*# ' + week_id + ':' + diary_entry
            else:
                # 简单转为字符串
                text += '#*# Unknown Week:' + str(week)

        text += '*** finished ***'
        return text

    @staticmethod
    async def async_generate_floor(model, example, semaphore):
        # 确保 floor_plan 是列表
        if 'floor_plan' not in example or not example['floor_plan']:
            example['floor_plan'] = []
        elif not isinstance(example['floor_plan'], list):
            if isinstance(example['floor_plan'], str):
                example['floor_plan'] = [{"floor_id": "Floor 1", "purpose": example['floor_plan']}]
            elif isinstance(example['floor_plan'], dict):
                example['floor_plan'] = [example['floor_plan']]
            else:
                example['floor_plan'] = []

        # 创建一个新列表来保存处理后的楼层计划
        processed_floors = []
        
        # 处理每个元素
        for i, floor in enumerate(example['floor_plan']):
            # 如果元素不是字典，创建一个新字典
            if not isinstance(floor, dict):
                processed_floor = {"floor_id": f"Floor {i+1}", "purpose": str(floor)}
            else:
                # 创建原始字典的深拷贝
                processed_floor = copy.deepcopy(floor)
                
                # 添加必要字段
                if 'floor_id' not in processed_floor:
                    processed_floor['floor_id'] = f"Floor {i+1}"
                if 'purpose' not in processed_floor:
                    processed_floor['purpose'] = ""
            
            processed_floors.append(processed_floor)
        
        # 用处理后的列表替换原始列表
        example['floor_plan'] = processed_floors

        async def process_floor(floor):
            # 不再需要检查floor是否为字典
            floor_id = floor.get('floor_id', "Unknown Floor")
            purpose = floor.get('purpose', "")
            
            # 确保purpose是字符串
            if not isinstance(purpose, str):
                if isinstance(purpose, list):
                    purpose = ", ".join([str(p) for p in purpose])
                else:
                    purpose = str(purpose)
            
            prompt = f"""You are an expert disigner. 
    Write a 150-word skyscraper floor plan for the floor of {floor_id}.
    The purpose for this floor is: {purpose}
    You should consider the coherence of the floor plan by referring to the plan of the whole skyscraper:
    {example['floor_plan']}

    You should consider the user requirements: {example['prompt']}
    Check from the user requirements if there are any special requirement that should be included in the floor plan. If there are, include them in the floor plan. If there are no special events, write a general floor plan.
    Return the floor plan for the floor of {floor_id} in the following json format:
    {{
        "floor_id": "{floor_id}",
        "check": "reason and check if the user requirements are met",
        "plan": "Your 150-word floor plan here" 
    }}
    """
            logging.info(f"Generating initial floor plan for floor {floor_id}")

            # 最多尝试3次获取有效响应
            max_attempts = 3
            for attempt in range(max_attempts):
                try:
                    async with semaphore:
                        response = await async_call_llm(model, prompt)
                    
                    # repair the json string
                    response = repair_json(response)

                    # 寻找JSON对象
                    match = re.search(r"\{.*\}", response, re.DOTALL)
                    if match:
                        json_str = match.group(0)
                        
                        try:
                            floor_plan = json.loads(json_str)
                            
                            # 检查必要的键是否存在
                            if 'plan' in floor_plan:
                                floor['plan'] = floor_plan['plan']
                                # 确保plan是字符串
                                if not isinstance(floor['plan'], str):
                                    floor['plan'] = str(floor['plan'])
                            elif 'floor_plan' in floor_plan:
                                floor['plan'] = floor_plan['floor_plan']
                                if not isinstance(floor['plan'], str):
                                    floor['plan'] = str(floor['plan'])
                            elif 'design' in floor_plan:
                                floor['plan'] = floor_plan['design']
                                if not isinstance(floor['plan'], str):
                                    floor['plan'] = str(floor['plan'])
                            else:
                                # 如果没有找到任何预期的键，从整个响应中提取内容
                                content = re.sub(r'[\{\}"\'floor_id[^:]*:|check[^:]*:|\s*]', '', json_str)
                                floor['plan'] = content.strip()
                                if not isinstance(floor['plan'], str):
                                    floor['plan'] = str(floor['plan'])
                        except json.JSONDecodeError as e:
                            logging.error(f"JSON decode error for {floor_id}: {e}, attempt {attempt+1}/{max_attempts}")
                            if attempt == max_attempts - 1:
                                # 最后一次尝试，使用原始响应
                                floor['plan'] = f"Skyscraper floor plan for {floor_id} with purpose: {purpose}"
                                floor['length_requirement'] = 150
                    else:
                        # 如果没有找到JSON，使用整个响应
                        logging.warning(f"No JSON found in response for {floor_id}, attempt {attempt+1}/{max_attempts}")
                        if attempt == max_attempts - 1:
                            floor['plan'] = response.strip() or f"Skyscraper floor plan for {floor_id} with purpose: {purpose}"
                            floor['length_requirement'] = 150
                except Exception as e:
                    logging.error(f"Error processing floor for {floor_id}: {e}, attempt {attempt+1}/{max_attempts}")
                    if attempt == max_attempts - 1:
                        floor['plan'] = f"Skyscraper floor plan for {floor_id} with purpose: {purpose}"
                        floor['length_requirement'] = 150

            # 确保plan字段存在
            if 'plan' not in floor:
                floor['plan'] = f"Skyscraper floor plan for {floor_id} with purpose: {purpose}"
                floor['length_requirement'] = 150
                logging.warning(f"Created fallback floor plan for {floor_id}")

            # Refine the floor plan
            try:
                current_length = count_words(floor['plan'])
                required_length = floor['length_requirement']

                word_diff = abs(required_length - current_length)

                # 只有当差距超过10%时才进行微调
                if word_diff > (required_length * 0.1):
                    refinement_prompt = f"""You are an expert editor. The provided text need to be {"shorten" if current_length > required_length else "lengthen"} by {word_diff} words while maintaining the original meaning and coherence.
                    Text:
                    {floor['plan']}
                    Return only the refined text."""

                    logging.info(f"Refining text for floor {floor_id}")
                    async with semaphore:
                        refined_text = await async_call_llm(model, refinement_prompt)
                    
                    if refined_text and len(refined_text) > 10:
                        floor['plan'] = refined_text.strip()
                        logging.info(f"Refined text: {floor['plan'][:50]}...")
                    
                    current_length = count_words(floor['plan'])
                    logging.info(f"Final floor plan word count: {current_length}")
            except Exception as e:
                logging.error(f"Error during refinement for {floor_id}: {e}")
            
            return floor

        # Process all floors concurrently
        tasks = [process_floor(floor) for floor in example['floor_plan']]
        
        try:
            processed_results = await asyncio.gather(*tasks)
            example['floor_plan'] = processed_results
        except Exception as e:
            logging.error(f"Error during concurrent floor processing: {e}")
            # 确保至少有一些结果
            processed_results = []
            for floor in example['floor_plan']:
                try:
                    if 'plan' not in floor:
                        floor['plan'] = f"Floor plan for {floor.get('floor_id', 'Unknown Floor')}"
                        floor['length_requirement'] = 150
                    processed_results.append(floor)
                except Exception as inner_e:
                    logging.error(f"Error processing individual floor: {inner_e}")
                    # 添加一个默认的楼层计划以保持结构完整
                    processed_results.append({
                        "floor_id": "Unknown Floor",
                        "plan": "Skyscraper floor plan placeholder.",
                        "length_requirement": 150
                    })
            
            example['floor_plan'] = processed_results

        example['final_text'] = GenerationAgent.get_final_floor_text(example['floor_plan'])

        return example

 
    @staticmethod
    def get_final_floor_text(floor_plan):
        """
        Get the final text from the generated text with respect to the plan.
        """
        text = ""

        for floor in floor_plan:
            if isinstance(floor, dict):
                floor_id = str(floor.get('floor_id', "Unknown Floor"))
                # 确保plan是字符串
                plan_text = floor.get('plan', "")
                if not isinstance(plan_text, str):
                    plan_text = str(plan_text)
                text += '#*# ' + floor_id + ':' + plan_text
            else:
                # 简单转为字符串
                text += '#*# Unknown Floor:' + str(floor)

        text += '*** finished'
        return text
    
    @staticmethod
    async def async_generate_menu(model, example, semaphore):
        # 确保 weekly_plan 是列表
        if 'weekly_plan' not in example or not example['weekly_plan']:
            example['weekly_plan'] = []
        elif not isinstance(example['weekly_plan'], list):
            if isinstance(example['weekly_plan'], str):
                example['weekly_plan'] = [{"week_id": "Week 1", "dishes": example['weekly_plan']}]
            elif isinstance(example['weekly_plan'], dict):
                example['weekly_plan'] = [example['weekly_plan']]
            else:
                example['weekly_plan'] = []

        # 创建一个新列表来保存处理后的菜单计划
        processed_weeks = []

        # 确保每个元素都包含必要字段
        for i, week in enumerate(example['weekly_plan']):
            # 如果元素不是字典，创建一个新字典
            if not isinstance(week, dict):
                processed_week = {"week_id": f"Menu Week {i+1}", "dishes": str(week)}
            else:
                # 创建原始字典的深拷贝
                processed_week = copy.deepcopy(week)

                # 添加必要字段
                if 'week_id' not in processed_week:
                    processed_week['week_id'] = f"Menu Week {i+1}"
                if 'dishes' not in processed_week:
                    processed_week['dishes'] = ""

            processed_weeks.append(processed_week)

        # 用处理后的列表替换原始列表
        example['weekly_plan'] = processed_weeks

        async def process_menu(week):
            # 不再需要检查 week 是否为字典，因为之前已经确保了所有元素都是字典
            week_id = week.get('week_id', "Unknown Menu Week")
            dishes = week.get('dishes', [])

            # 确保 dishes 是字符串表示
            dishes_str = ""
            if isinstance(dishes, list):
                # 处理每个 dish 项，确保都是字符串
                dishes_str = ", ".join([str(dish) for dish in dishes])
            else:
                dishes_str = str(dishes)

            prompt = f"""You are an expert chef. 
    Write a 200-word weekly menu plan for the week of {week_id}.
    The dishes for this week are: {dishes_str}
    You should consider the coherence of the menu plan referring to the plan of the whole year:
    {example['weekly_plan']}
    You should consider the user requirements: {example['prompt']}
    Check from the user requirements if there are any special dishes that should be included in the menu plan. If there are, include them in the menu plan. If there are no special dishes, write a general menu plan for the week.
    Return the menu plan in the following json format:
    {{
        "week_id": "{week_id}",
        "check": "reason and check if the user requirements are met",
        "week_menu": "Your 200-word menu plan here"
    }}
    """
            logging.info(f"Generating initial menu plan for week {week_id}")

            # 最多尝试3次获取有效响应
            max_attempts = 3
            for attempt in range(max_attempts):
                try:
                    async with semaphore:
                        response = await async_call_llm(model, prompt)

                    # 修复 JSON 字符串
                    response = repair_json(response)

                    # 寻找 JSON 对象
                    match = re.search(r"\{.*\}", response, re.DOTALL)
                    if match:
                        json_str = match.group(0)

                        try:
                            week_menu_json = json.loads(json_str)

                            # 检查必要的键是否存在
                            if 'week_menu' in week_menu_json:
                                week['week_menu'] = week_menu_json['week_menu']
                                # 确保 week_menu 是字符串
                                if not isinstance(week['week_menu'], str):
                                    week['week_menu'] = str(week['week_menu'])
                            else:
                                # 如果没有找到任何预期的键，从整个响应中提取内容
                                content = re.sub(r'[\{\}"\'week_id[^:]*:|check[^:]*:|\s*]', '', json_str)
                                week['week_menu'] = content.strip()
                                if not isinstance(week['week_menu'], str):
                                    week['week_menu'] = str(week['week_menu'])

                            week['length_requirement'] = 200
                            logging.info(f"Menu plan word count: {count_words(week['week_menu'])}")
                            break
                        except json.JSONDecodeError as e:
                            logging.error(f"JSON decode error for {week_id}: {e}, attempt {attempt+1}/{max_attempts}")
                            if attempt == max_attempts - 1:
                                # 最后一次尝试，使用原始响应
                                week['week_menu'] = f"Weekly menu for {week_id} featuring {dishes_str}"
                                week['length_requirement'] = 200
                    else:
                        # 如果没有找到 JSON，使用整个响应
                        logging.warning(f"No JSON found in response for {week_id}, attempt {attempt+1}/{max_attempts}")
                        if attempt == max_attempts - 1:
                            week['week_menu'] = response.strip() or f"Weekly menu for {week_id} featuring {dishes_str}"
                            week['length_requirement'] = 200
                except Exception as e:
                    logging.error(f"Error processing menu for {week_id}: {e}, attempt {attempt+1}/{max_attempts}")
                    if attempt == max_attempts - 1:
                        week['week_menu'] = f"Weekly menu for {week_id} featuring {dishes_str}"
                        week['length_requirement'] = 200

            # 确保 week_menu 字段存在
            if 'week_menu' not in week:
                week['week_menu'] = f"Weekly menu for {week_id} featuring {dishes_str}"
                week['length_requirement'] = 200

            return week

        # 并发处理所有菜单周
        tasks = [process_menu(week) for week in example['weekly_plan']]

        try:
            processed_results = await asyncio.gather(*tasks)
            example['weekly_plan'] = processed_results
        except Exception as e:
            logging.error(f"Error during concurrent menu processing: {e}")
            # 确保至少有一些结果
            processed_results = []
            for week in example['weekly_plan']:
                try:
                    if 'week_menu' not in week:
                        week['week_menu'] = f"Weekly menu for {week.get('week_id', 'Unknown Week')}"
                        week['length_requirement'] = 200
                    processed_results.append(week)
                except Exception as inner_e:
                    logging.error(f"Error processing individual menu week: {inner_e}")
                    # 添加一个默认的菜单计划以保持结构完整
                    processed_results.append({
                        "week_id": "Unknown Menu Week",
                        "week_menu": "Weekly menu placeholder.",
                        "length_requirement": 200
                    })

            example['weekly_plan'] = processed_results

        example['final_text'] = GenerationAgent.get_final_menu_text(example['weekly_plan'])
        return example

    @staticmethod
    def get_final_menu_text(weekly_plan):
        """
        Get the final text from the generated text with respect to the plan.
        """
        text = ""

        for week in weekly_plan:
            if isinstance(week, dict):
                week_id = str(week.get('week_id', "Unknown Menu Week"))
                # 确保week_menu是字符串
                menu = week.get('week_menu', "")
                if not isinstance(menu, str):
                    menu = str(menu)
                text += '#*# ' + week_id + ':' + menu
            else:
                # 简单转为字符串
                text += '#*# Unknown Menu Week:' + str(week)

        text += '*** finished ***'
        return text

    @staticmethod
    async def async_generate_block(model, example, semaphore):
        # 确保 block_plan 是列表
        if 'block_plan' not in example or not example['block_plan']:
            example['block_plan'] = []
        elif not isinstance(example['block_plan'], list):
            if isinstance(example['block_plan'], str):
                example['block_plan'] = [{"block_id": "Block 1", "use": example['block_plan']}]
            elif isinstance(example['block_plan'], dict):
                example['block_plan'] = [example['block_plan']]
            else:
                example['block_plan'] = []

        # 创建一个新列表来保存处理后的区块计划
        processed_blocks = []
        
        # 处理每个元素
        for i, block in enumerate(example['block_plan']):
            # 如果元素不是字典，创建一个新字典
            if not isinstance(block, dict):
                processed_block = {"block_id": f"Block {i+1}", "use": str(block)}
            else:
                # 创建原始字典的深拷贝
                processed_block = copy.deepcopy(block)
                
                # 添加必要字段
                if 'block_id' not in processed_block:
                    processed_block['block_id'] = f"Block {i+1}"
                
                if 'use' not in processed_block:
                    # 尝试从其他字段获取信息
                    if any(processed_block.values()):
                        # 找一个有值的字段作为use
                        for key, value in processed_block.items():
                            if value and key != 'block_id':
                                processed_block['use'] = f"{key}: {value}"
                                break
                    
                    # 如果没找到或没有值，设置默认值
                    if 'use' not in processed_block:
                        processed_block['use'] = ""
            
            processed_blocks.append(processed_block)
        
        # 用处理后的列表替换原始列表
        example['block_plan'] = processed_blocks

        async def process_block(block):
            # 不再需要检查block是否为字典
            block_id = block.get('block_id', "Unknown Block")
            use = block.get('use', "")
            
            # 确保use是字符串
            if not isinstance(use, str):
                if isinstance(use, list):
                    use = ", ".join([str(item) for item in use])
                else:
                    use = str(use)
            
            prompt = f"""You are an expert disigner. 
    Write a 150-word city block plan for the block of {block_id}.
    The use for this block is: {use}
    You should consider the coherence of the block plan by referring to the plan of the whole city:
    {example['block_plan']}

    You should consider the user requirements: {example['prompt']}
    Check from the user requirements if there are any special requirement that should be included in the block plan. If there are, include them in the block plan. If there are no special events, write a general block plan.
    Return the block plan for the block of {block_id} in the following json format:
    {{
        "block_id": "{block_id}",
        "check": "reason and check if the user requirements are met",
        "plan": "Your 150-word block plan here" 
    }}
    """
            logging.info(f"Generating initial block plan for block {block_id}")

            # 最多尝试3次获取有效响应
            max_attempts = 3
            for attempt in range(max_attempts):
                try:
                    async with semaphore:
                        response = await async_call_llm(model, prompt)
                    
                    # repair the json string
                    response = repair_json(response)

                    # 寻找JSON对象
                    match = re.search(r"\{.*\}", response, re.DOTALL)
                    if match:
                        json_str = match.group(0)
                        
                        try:
                            block_plan = json.loads(json_str)
                            
                            # 检查必要的键是否存在
                            if 'plan' in block_plan:
                                block['plan'] = block_plan['plan']
                                # 确保plan是字符串
                                if not isinstance(block['plan'], str):
                                    block['plan'] = str(block['plan'])
                            elif 'design' in block_plan:
                                # 尝试使用替代键
                                block['plan'] = block_plan['design']
                                if not isinstance(block['plan'], str):
                                    block['plan'] = str(block['plan'])
                            elif 'block_plan' in block_plan:
                                block['plan'] = block_plan['block_plan']
                                if not isinstance(block['plan'], str):
                                    block['plan'] = str(block['plan'])
                            else:
                                # 如果没有找到任何预期的键，从整个响应中提取内容
                                content = re.sub(r'[\{\}"\'block_id[^:]*:|check[^:]*:|\s*]', '', json_str)
                                block['plan'] = content.strip()
                                if not isinstance(block['plan'], str):
                                    block['plan'] = str(block['plan'])
                                
                            block['length_requirement'] = 150
                            logging.info(f"Block plan word count: {count_words(block['plan'])}")
                            break
                        except json.JSONDecodeError as e:
                            logging.error(f"JSON decode error for {block_id}: {e}, attempt {attempt+1}/{max_attempts}")
                            if attempt == max_attempts - 1:
                                # 最后一次尝试，使用原始响应
                                block['plan'] = f"City block plan for {block_id} with use: {use}"
                                block['length_requirement'] = 150
                    else:
                        # 如果没有找到JSON，使用整个响应
                        logging.warning(f"No JSON found in response for {block_id}, attempt {attempt+1}/{max_attempts}")
                        if attempt == max_attempts - 1:
                            block['plan'] = response.strip() or f"City block plan for {block_id} with use: {use}"
                            block['length_requirement'] = 150
                except Exception as e:
                    logging.error(f"Error processing block plan for {block_id}: {e}, attempt {attempt+1}/{max_attempts}")
                    if attempt == max_attempts - 1:
                        block['plan'] = f"City block plan for {block_id} with use: {use}"
                        block['length_requirement'] = 150

            # 确保plan字段存在
            if 'plan' not in block:
                block['plan'] = f"City block plan for {block_id} with use: {use}"
                block['length_requirement'] = 150
                logging.warning(f"Created fallback block plan for {block_id}")

            # Refine the block plan
            try:
                current_length = count_words(block['plan'])
                required_length = block['length_requirement']

                word_diff = abs(required_length - current_length)

                # 只有当差距超过10%时才进行微调
                if word_diff > (required_length * 0.1):
                    refinement_prompt = f"""You are an expert editor. The provided text need to be {"shorten" if current_length > required_length else "lengthen"} by {word_diff} words while maintaining the original meaning and coherence.
                    Text:
                    {block['plan']}
                    Return only the refined text."""

                    logging.info(f"Refining text for block {block_id}")
                    async with semaphore:
                        refined_text = await async_call_llm(model, refinement_prompt)
                    
                    if refined_text and len(refined_text) > 10:
                        block['plan'] = refined_text.strip()
                        logging.info(f"Refined text: {block['plan'][:50]}...")
                    
                    current_length = count_words(block['plan'])
                    logging.info(f"Final block plan word count: {current_length}")
            except Exception as e:
                logging.error(f"Error during refinement for {block_id}: {e}")

            return block

        # Process all blocks concurrently
        tasks = [process_block(block) for block in example['block_plan']]
        
        try:
            processed_results = await asyncio.gather(*tasks)
            example['block_plan'] = processed_results
        except Exception as e:
            logging.error(f"Error during concurrent block processing: {e}")
            # 确保至少有一些结果
            processed_results = []
            for block in example['block_plan']:
                try:
                    if 'plan' not in block:
                        block['plan'] = f"Block plan for {block.get('block_id', 'Unknown Block')}"
                        block['length_requirement'] = 150
                    processed_results.append(block)
                except Exception as inner_e:
                    logging.error(f"Error processing individual block: {inner_e}")
                    # 添加一个默认的区块计划以保持结构完整
                    processed_results.append({
                        "block_id": "Unknown Block",
                        "plan": "City block plan placeholder.",
                        "length_requirement": 150
                    })
            
            example['block_plan'] = processed_results

        example['final_text'] = GenerationAgent.get_final_block_text(example['block_plan'])

        return example

    @staticmethod
    def get_final_block_text(block_plan):
        """
        Get the final text from the generated text with respect to the plan.
        """
        text = ""

        for block in block_plan:
            if isinstance(block, dict):
                block_id = str(block.get('block_id', "Unknown Block"))
                # 确保plan是字符串
                plan_text = block.get('plan', "")
                if not isinstance(plan_text, str):
                    plan_text = str(plan_text)
                text += '#*# ' + block_id + ':' + plan_text
            else:
                # 简单转为字符串
                text += '#*# Unknown Block:' + str(block)

        text += '*** finished'
        return text