from pathlib import Path
import sys
# Add project root to sys.path
sys.path.append(str(Path(__file__).resolve().parents[1]))

import json
from typing import List, Optional, Dict, Any
from datetime import datetime
import re
from schema import ExpertFeedbackPack, ExpertFeedbackItem, FeedbackSource


class ExpertFeedbackStore:
    """专家反馈持久化存储。
    默认存放在 ./knowledgeBase/experience_library.json
    """

    def __init__(self, storage_path: str = "knowledgeBase/experience_library.json"):
        self.storage_path = storage_path
        Path("knowledgeBase").mkdir(parents=True, exist_ok=True)
        
        # 如果存储文件不存在，尝试加载外部默认知识库
        if not Path(self.storage_path).exists():
            default_external = "knowledgeBase/external_knowledge.json"
            if Path(default_external).exists():
                # 避免循环调用，先创建一个空文件
                self.save(ExpertFeedbackPack(items=[]))
                self.load_external_knowledge(default_external)

    def load(self) -> ExpertFeedbackPack:
        p = Path(self.storage_path)
        if not p.exists():
            return ExpertFeedbackPack(items=[])
        data = json.loads(p.read_text(encoding="utf-8"))
        return ExpertFeedbackPack(**data)

    def save(self, pack: ExpertFeedbackPack) -> None:
        p = Path(self.storage_path)
        p.write_text(pack.model_dump_json(indent=2), encoding="utf-8")

    def add_feedback(self, item: ExpertFeedbackItem) -> None:
        pack = self.load()
        pack.items.append(item)
        self.save(pack)

    # ---- 输入规范化辅助 ----
    def _normalize_condition(self, condition: Optional[Any]) -> Optional[Dict[str, Any]]:
        """将 condition 规范为字典。支持 str(JSON/普通文本)、dict、其他类型。"""
        if condition is None:
            return None
        if isinstance(condition, dict):
            return condition
        if isinstance(condition, str):
            s = condition.strip()
            if not s:
                return None
            # 尝试解析为 JSON 对象
            try:
                parsed = json.loads(s)
                if isinstance(parsed, dict):
                    return parsed
            except Exception:
                pass
            return {"note": s}
        # 其他类型统一转字符串放入 note
        return {"note": str(condition)}

    def _normalize_tags(self, tags: Optional[Any]) -> List[str]:
        """将 tags 规范为字符串列表。支持 str(JSON/逗号分隔)、list、其他类型。"""
        if tags is None:
            return []
        if isinstance(tags, list):
            return [str(t).strip() for t in tags if str(t).strip()]
        if isinstance(tags, str):
            s = tags.strip()
            if not s:
                return []
            # 优先尝试 JSON 列表
            try:
                parsed = json.loads(s)
                if isinstance(parsed, list):
                    return [str(t).strip() for t in parsed if str(t).strip()]
            except Exception:
                pass
            # 其次按逗号分隔
            if "," in s:
                return [part.strip() for part in s.split(",") if part.strip()]
            return [s]
        # 其他类型
        return [str(tags)]


    def query(self, task_type: Optional[str] = None, condition_contains: Optional[Dict[str, Any]] = None, 
              source: Optional[FeedbackSource] = None, tags: Optional[List[str]] = None) -> List[ExpertFeedbackItem]:
        """按任务类型与条件子集检索反馈。condition_contains 所有键值需被包含。"""
        pack = self.load()
        result: List[ExpertFeedbackItem] = []
        for it in pack.items:
            if task_type and it.task_type != task_type:
                continue
            if condition_contains:
                cond = it.condition or {}
                ok = all(k in cond and cond[k] == v for k, v in condition_contains.items())
                if not ok:
                    continue
            if source and it.source != source:
                continue
            if tags and not any(tag in it.tags for tag in tags):
                continue
            result.append(it)
        return result

    def add_success_case_feedback(self, case_id: str, task_type: str, recommendation: str, anti_pattern: str,
                                 rationale: str, condition: Optional[Dict[str, Any]] = None,
                                 tags: Optional[List[str]] = None) -> None:
        """从成功案例库添加反馈"""
        item = ExpertFeedbackItem(
            task_type=task_type,
            condition=self._normalize_condition(condition),
            recommendation=recommendation,
            anti_pattern=anti_pattern,
            rationale=rationale,
            score=0.8,  # 默认成功案例经验置信度较高
            source=FeedbackSource.SUCCESS_CASE,
            source_id=case_id,
            created_by="system",
            created_at=datetime.now().isoformat(),
            tags=self._normalize_tags(tags)
        )
        self.add_feedback(item)

    def add_external_knowledge_feedback(self, doc_id: str, task_type: str, recommendation: str,anti_pattern: str,
                                       rationale: str, condition: Optional[Dict[str, Any]] = None,
                                       tags: Optional[List[str]] = None) -> None:
        """从外部知识库添加反馈"""
        item = ExpertFeedbackItem(
            task_type=task_type,
            condition=self._normalize_condition(condition),
            recommendation=recommendation,
            anti_pattern=anti_pattern,
            score=0.8,  # 默认外部经验经验置信度较高
            rationale=rationale,
            source=FeedbackSource.EXTERNAL_KNOWLEDGE,
            source_id=doc_id,
            created_by="external_knowledge",
            created_at=datetime.now().isoformat(),
            tags=self._normalize_tags(tags)
        )
        self.add_feedback(item)

    def add_human_feedback(self, user_id: str, task_type: str, recommendation: str,anti_pattern: str,
                          rationale: str, condition: Optional[Dict[str, Any]] = None,
                          tags: Optional[List[str]] = None, score: Optional[float] = None) -> None:
        """从人机交互添加反馈"""
        item = ExpertFeedbackItem(
            task_type=task_type,
            condition=self._normalize_condition(condition),
            recommendation=recommendation,
            anti_pattern=anti_pattern,
            rationale=rationale,
            score=score,
            source=FeedbackSource.HUMAN_INTERACTION,
            source_id=f"human_{user_id}_{datetime.now().strftime('%Y%m%d_%H%M%S')}",
            created_by=user_id,
            created_at=datetime.now().isoformat(),
            tags=self._normalize_tags(tags)
        )
        self.add_feedback(item)

    def extract_from_success_case(self, case_path: str, task_type: Optional[str] = None) -> None:
        """使用大模型从成功案例中智能提取经验
        Args:
            case_path: 案例文件路径 (plan.json)
            task_type: 可选，指定只提取某个任务类型的经验；若为 None，则提取所有成功任务的经验
        """
        import logger
        from prompt.knowledge import EXTRACT_EXPERIENCE_SYSTEM_PROMPT, EXTRACT_EXPERIENCE_USER_PROMPT
        from llm import LLM
        from utils import parse_res,remove_code_recursive
        try:
            logger.info(f"[经验提取] 读取案例文件: {case_path}")
            case_data = json.loads(Path(case_path).read_text(encoding="utf-8"))
            remove_code_recursive(case_data, field_name="code")  # 移除代码字段
            is_success= case_data.get("current_task","").get("task_result","").get("is_success")
            # 构造 prompt
            user_prompt = EXTRACT_EXPERIENCE_USER_PROMPT + "\n\n" + "# 以下是本次任务执行过程：\n" + str(case_data)

            llm = LLM()
            messages = [
                {"role": "system", "content": EXTRACT_EXPERIENCE_SYSTEM_PROMPT},
                {"role": "user", "content": user_prompt}
            ]
            response = llm.ask(messages)
            try:
                feedbacks = json.loads(parse_res(response))
                logger.debug(f"[经验提取] LLM解析后输出: {feedbacks}")
            except Exception as e:
                logger.error(f"[经验提取] LLM输出解析失败: {e}\n原始内容: {response.choices[0].message.content[:500]}")
                return

            # 保存经验
            count = 0
            for fb in feedbacks:
                if isinstance(fb, dict) and "recommendation" in fb and "rationale" in fb:
                    # 规范化字段，避免 Pydantic 校验错误
                    norm_condition = self._normalize_condition(fb.get("condition"))
                    norm_tags = self._normalize_tags(fb.get("tags", ["auto_extracted", "success_case"]))
                    if not norm_tags:
                        norm_tags = ["auto_extracted", "success_case"]
                    self.add_success_case_feedback(
                        case_id=Path(case_path).stem,
                        task_type=str(fb.get("task_type", "其他")),
                        recommendation=fb["recommendation"],
                        anti_pattern=fb.get("anti_pattern",""),
                        rationale=fb["rationale"],
                        condition=norm_condition,
                        tags=norm_tags
                    )
                    logger.info(f"[经验提取] 已保存经验: {fb.get('task_type', '其他')} | {fb['recommendation']}")
                    count += 1
                else:
                    logger.warning(f"[经验提取] 跳过格式不完整的经验: {fb}")
            logger.success(f"[经验提取] 共保存 {count} 条经验建议。")
        except Exception as e:
            logger.error(f"[经验提取] 提取失败: {e}")
            import traceback
            traceback.print_exc()
     

    def load_external_knowledge(self, knowledge_file: str) -> None:
        """从外部知识库文件加载经验"""
        try:
            with open(knowledge_file, 'r', encoding='utf-8') as f:
                knowledge_data = json.load(f)
            
            for item_data in knowledge_data.get("feedback_items", []):
                self.add_external_knowledge_feedback(
                    doc_id=item_data.get("source_id", "external_doc"),
                    task_type=item_data["task_type"],
                    recommendation=item_data["recommendation"],
                    anti_pattern=item_data.get("anti_pattern",""),
                    rationale=item_data.get("rationale", ""),
                    condition=item_data.get("condition"),
                    tags=item_data.get("tags", [])
                )
        except Exception as e:
            print(f"加载外部知识库失败: {e}")

    def get_feedback_summary(self) -> Dict[str, Any]:
        """获取反馈统计摘要"""
        pack = self.load()
        summary = {
            "total_items": len(pack.items),
            "by_source": {},
            "by_task_type": {}
        }
        
        for item in pack.items:
            # 按来源统计
            source = item.source.value
            summary["by_source"][source] = summary["by_source"].get(source, 0) + 1
            
            # 按任务类型统计
            task_type = item.task_type
            summary["by_task_type"][task_type] = summary["by_task_type"].get(task_type, 0) + 1
            
            # no score-based statistics (score field removed)
        
        return summary

if __name__ == "__main__":
    import logger
    import globals
    logger.init()
    expertFeedbackStore=ExpertFeedbackStore()
    expertFeedbackStore.extract_from_success_case(case_path="output/results/test_mlebench_plant-pathology-2020-fgvc7_20251223100639/plan.json", task_type=None)

