from functools import total_ordering
from typing import List, Dict, Optional, Any, Literal, Tuple, Union
from enum import Enum
from datetime import datetime, timezone, timedelta
from pydantic import BaseModel, ConfigDict, Field, field_validator
import uuid
from src.utils.string_utils import trim_long_string
import math
import logging
from src.models.agent_models import ActionType
logger = logging.getLogger(__name__)

class NoteType(str, Enum):
    API = "api"
    CODE_EXAMPLE = "code-example"
    EXPERIENCE = "experience"

class ExperienceType(str,Enum):
    General = "General"
    OperatorSpecific = "Operator-Specific"

class ExperienceSource(str,Enum):
    BASIC_FAILURE = "BasicFailure"  # Errors caused by inability to write code
    DRAFT_SUCCESS = "DraftSuccess" # Successfully wrote code
    DEBUG_SUCCESS = "DebugSuccess" # Successfully modified code
    OPTIMIZE_FAILURE = "OptimizeFailure" # Errors caused by inability to optimize
    OPTIMIZE_SUCCESS = "OptimizeSuccess" # Successfully optimized code
    BEST_PRACTICE = "BestPractice" # Best practices

@total_ordering 
class BaseMemoryNote(BaseModel):
    """A memory note representing a single unit of information in the memory system."""
    model_config = ConfigDict(extra='forbid', populate_by_name=True)
    
    id: str = Field(default_factory=lambda: str(uuid.uuid4()), description="Unique identifier")
    memory: Optional[str] = Field(default=None, alias="memory", description="Main text content")
    note_type: str = "unknown"
    score: Optional[float] = Field(default=0.0, description="Similarity score of the note")

    created_at: datetime = Field(default_factory=lambda: datetime.now(timezone.utc))
    last_accessed_at: datetime = Field(default_factory=lambda: datetime.now(timezone.utc))
    retrieval_count: int = Field(default=0, description="Number of times this memory was retrieved")


    # RL metadata (no-op when value-driven memory is disabled)
    # Draft stage Q values
    draft_q_value: Optional[float] = Field(default=0.0, description="Learned Q value for RL selection in draft stage")
    draft_q_visits: int = Field(default=0, description="Number of times this memory participated in Q updates in draft stage")
    draft_reward_ma: Optional[float] = Field(default=0.0, description="Exponential moving average of rewards in draft stage")
    draft_last_reward: Optional[float] = Field(default=0.0, description="Reward received for the last usage in draft stage")
    draft_q_updated_at: Optional[datetime] = Field(default=None, description="Timestamp of last Q value update in draft stage")
    
    # Optimize stage Q values
    optimize_q_value: Optional[float] = Field(default=0.0, description="Learned Q value for RL selection in optimize stage")
    optimize_q_visits: int = Field(default=0, description="Number of times this memory participated in Q updates in optimize stage")
    optimize_reward_ma: Optional[float] = Field(default=0.0, description="Exponential moving average of rewards in optimize stage")
    optimize_last_reward: Optional[float] = Field(default=0.0, description="Reward received for the last usage in optimize stage")
    optimize_q_updated_at: Optional[datetime] = Field(default=None, description="Timestamp of last Q value update in optimize stage")
    
    # Legacy fields for backward compatibility (deprecated, use stage-specific fields instead)
    q_value: Optional[float] = Field(default=0.0, description="[DEPRECATED] Use draft_q_value or optimize_q_value instead")
    q_visits: int = Field(default=0, description="[DEPRECATED] Use draft_q_visits or optimize_q_visits instead")
    reward_ma: Optional[float] = Field(default=0.0, description="[DEPRECATED] Use draft_reward_ma or optimize_reward_ma instead")
    last_reward: Optional[float] = Field(default=0.0, description="[DEPRECATED] Use draft_last_reward or optimize_last_reward instead")
    q_updated_at: Optional[datetime] = Field(default=None, description="[DEPRECATED] Use draft_q_updated_at or optimize_q_updated_at instead")

    @field_validator('score', mode='before')
    @classmethod
    def _round_score(cls, v: Optional[float]) -> Optional[float]:
        """Round score to 6 decimal places."""
        if v is None:
            return None
        return round(float(v), 6) if math.isfinite(v) else v

    @field_validator('draft_q_value', 'optimize_q_value', 'q_value', mode='before')
    @classmethod
    def _round_q_value(cls, v: Optional[float]) -> Optional[float]:
        """Round q_value to 6 decimal places."""
        if v is None:
            return None
        return round(float(v), 6) if math.isfinite(v) else v

    @field_validator('draft_reward_ma', 'optimize_reward_ma', 'reward_ma', mode='before')
    @classmethod
    def _round_reward_ma(cls, v: Optional[float]) -> Optional[float]:
        """Round reward_ma to 6 decimal places."""
        if v is None:
            return None
        return round(float(v), 6) if math.isfinite(v) else v

    def update_state(self):
        self.retrieval_count += 1
        self.last_accessed_at = datetime.now(timezone.utc)
    
    def model_dump(self, *, exclude: Optional[List[str]] = None, **kwargs) -> Dict[str, Any]:
        """Dump model to dictionary, excluding 'id' and 'score' by default."""
        exclude_set = set(exclude or ())
        exclude_set |= {'id', 'score'}
        return super().model_dump(exclude=exclude_set, **kwargs)
    
    # ---------------------------
    # Q value accessors by stage
    # ---------------------------
    def _get_q_fields(self, stage: ActionType) -> Dict[str, str]:
        """Get the field names for Q values based on stage.
        
        Args:
            stage: Stage identifier, can be ActionType.DRAFT or ActionType.OPTIMIZE
            
        Returns:
            Dictionary mapping generic names to stage-specific field names
        """
        if stage == ActionType.DRAFT:
            return {
                'q_value': 'draft_q_value',
                'q_visits': 'draft_q_visits',
                'reward_ma': 'draft_reward_ma',
                'last_reward': 'draft_last_reward',
                'q_updated_at': 'draft_q_updated_at',
            }
        elif stage == ActionType.OPTIMIZE:
            return {
                'q_value': 'optimize_q_value',
                'q_visits': 'optimize_q_visits',
                'reward_ma': 'optimize_reward_ma',
                'last_reward': 'optimize_last_reward',
                'q_updated_at': 'optimize_q_updated_at',
            }
        else:
            raise ValueError(f"Unknown stage: {stage}. Must be {ActionType.DRAFT} or {ActionType.OPTIMIZE}")
    
    def get_q_value(self, stage: ActionType) -> Optional[float]:
        """Get Q value for a specific stage."""
        fields = self._get_q_fields(stage)
        return getattr(self, fields['q_value'])
    
    def get_reward_ma(self, stage: ActionType) -> Optional[float]:
        """Get reward moving average for a specific stage."""
        fields = self._get_q_fields(stage)
        return getattr(self, fields['reward_ma'])
        
    # ---------------------------
    # Q update
    # ---------------------------
    def update_q(
        self,
        *,
        reward: Optional[float],
        stage: ActionType,
        alpha: float = 0.1,
        init_q: float = 0.0,
        reward_ma_beta: float = 0.1,
        clip_error: Optional[float] = None,
        alpha_decay: Literal["none", "inv_sqrt", "inv"] = "none",
        now: Optional[datetime] = None,
    ) -> Dict[str, Any]:
        """
        Bandit-style update (no next state, no future return):
            Q <- Q + alpha * (reward - Q)

        Args:
            reward: Reward value for this update
            stage: Stage identifier (ActionType.DRAFT or ActionType.OPTIMIZE)
            alpha: Learning rate
            init_q: Initial Q value if Q is not initialized
            reward_ma_beta: Beta parameter for reward moving average
            clip_error: Optional error clipping value
            alpha_decay: Alpha decay strategy ("none", "inv_sqrt", or "inv")
            now: Current timestamp (defaults to now)

        alpha_decay:
          - "none":     constant alpha
          - "inv_sqrt": alpha / sqrt(1 + q_visits)
          - "inv":      alpha / (1 + q_visits)

        Returns debug info: reward, error, used_alpha, new_q, q_visits
        """

        # ---- validate ----
        if not (0.0 < alpha <= 1.0):
            raise ValueError(f"alpha must be in (0,1], got {alpha}")
        if not (0.0 <= reward_ma_beta <= 1.0):
            raise ValueError(f"reward_ma_beta must be in [0,1], got {reward_ma_beta}")
        
        t = now or datetime.now(timezone.utc)
        
        # Get stage-specific field names
        fields = self._get_q_fields(stage)
        
        # Get current Q value for this stage
        current_q_value = getattr(self, fields['q_value'])
        current_q_visits = getattr(self, fields['q_visits'])
        current_reward_ma = getattr(self, fields['reward_ma'])

        # ---- init Q if needed ----
        if current_q_value is None or not math.isfinite(current_q_value):
            new_q_value = round(float(init_q), 6) if math.isfinite(init_q) else float(init_q)
            setattr(self, fields['q_value'], new_q_value)
            current_q_value = new_q_value

        # ---- possibly decay alpha by visits (stabilizes noisy rewards) ----
        used_alpha = float(alpha)
        v = max(0, int(current_q_visits))
        if alpha_decay == "inv_sqrt":
            used_alpha = used_alpha / math.sqrt(1.0 + v)
        elif alpha_decay == "inv":
            used_alpha = used_alpha / (1.0 + v)
        
        # ---- error and optional clipping ----
        error = reward - float(current_q_value)
        if clip_error is not None:
            c = float(clip_error)
            if c < 0:
                raise ValueError("clip_error must be >= 0")
            error = max(-c, min(c, error)) # clip error to [-c, c]
        
        # ---- update value ----
        new_q = float(current_q_value) + used_alpha * error # Q <- Q + alpha * (reward - Q)
        new_q_value = round(new_q, 6) if math.isfinite(new_q) else new_q
        setattr(self, fields['q_value'], new_q_value)

        # ---- metadata ----
        setattr(self, fields['q_visits'], current_q_visits + 1)
        setattr(self, fields['last_reward'], float(reward))
        setattr(self, fields['q_updated_at'], t)

        if current_reward_ma is None or not math.isfinite(current_reward_ma):
            new_reward_ma = round(float(reward), 6) if reward is not None and math.isfinite(reward) else float(reward)
            setattr(self, fields['reward_ma'], new_reward_ma)
        else:
            new_reward_ma = (1.0 - reward_ma_beta) * float(current_reward_ma) + reward_ma_beta * float(reward)
            new_reward_ma = round(new_reward_ma, 6) if math.isfinite(new_reward_ma) else new_reward_ma
            setattr(self, fields['reward_ma'], new_reward_ma)

        return {
            "reward": float(reward),
            "error": round(float(error), 6) if math.isfinite(error) else float(error),
            "used_alpha": round(float(used_alpha), 6) if math.isfinite(used_alpha) else float(used_alpha),
            "new_q": float(new_q_value),  # Already rounded to 6 decimal places
            "new_q_visits": int(current_q_visits + 1),
        }

    def sort_key(self, stage: Optional[ActionType] = None) -> Tuple[Any, ...]:
        """
        Sort priority (from high to low):
        1) q_value (larger is better)
        2) reward_ma (larger is better)
        3) score (similarity, larger is better)
        4) created_at (time: newer is better)

        Args:
            stage: Optional stage identifier (ActionType.DRAFT or ActionType.OPTIMIZE). 
                   If None, uses draft_q_value and draft_reward_ma by default.
        """

        if stage is not None:
            # Use stage-specific Q values
            fields = self._get_q_fields(stage)
            q = getattr(self, fields['q_value'])
            rma = getattr(self, fields['reward_ma'])
        else:
            # Default to draft Q values for backward compatibility
            q = self.draft_q_value
            rma = self.draft_reward_ma
        
        if q is None or not math.isfinite(q):
            q = float("0.0")

        if rma is None or not math.isfinite(rma):
            rma = float("0.0")

        sim = self.score
        if sim is None or not math.isfinite(sim):
            sim = float("-inf")
        else:
            sim = round(float(sim), 4) if math.isfinite(sim) else float(sim)
        
        # Safely get timestamp
        try:
            created_at_value = getattr(self, 'created_at', None)
            if isinstance(created_at_value, datetime):
                ts = created_at_value.timestamp()
            else:
                # If created_at is not a datetime type, use default timestamp
                ts = datetime(1970, 1, 1, tzinfo=timezone.utc).timestamp()

        except (AttributeError, TypeError):
            # If accessing created_at fails, use default timestamp
            ts = datetime(1970, 1, 1, tzinfo=timezone.utc).timestamp()
            logger.info(f"created_at access error, use default timestamp: {ts}")
        
        return (q, rma, sim, ts)

    def similarity_sort_key(self) -> Tuple[Any, ...]:
        """
        Sort priority (from high to low):
        1) score (similarity, larger is better)
        2) created_at (time: newer is better)
        """
        sim = self.score
        if sim is None or not math.isfinite(sim):
            sim = float("-inf")
        else:
            sim = round(float(sim), 4) if math.isfinite(sim) else float(sim)
        try:
            created_at_value = getattr(self, 'created_at', None)
            if isinstance(created_at_value, datetime):
                ts = created_at_value.timestamp()
            else:
                # If created_at is not a datetime type, use default timestamp
                ts = datetime(1970, 1, 1, tzinfo=timezone.utc).timestamp()
        except (AttributeError, TypeError):
            # If accessing created_at fails, use default timestamp
            ts = datetime(1970, 1, 1, tzinfo=timezone.utc).timestamp()
            logger.info(f"created_at access error, use default timestamp: {ts}")
        return (sim, ts)
    
    def concept_drift_sort_key(
        self,
        *,
        decay_factor: float,
        recent_bonus: float,
        recent_window_days: int,
        stage: Optional[ActionType] = None,
        now: Optional[datetime] = None,
    ) -> Tuple[Any, ...]:
        """
        Calculate sort key considering concept drift.
        
        Based on the original sort key (Q value, reward_ma, score, time), add time weighting:
        1. Recent successful experiences get additional weight
        2. Newer experiences get time decay weight
        
        Args:
            decay_factor: Time decay factor, larger values give higher weight to recent experiences
            recent_bonus: Reward weight for recent successful experiences
            recent_window_days: Time window (in days) considered as "recent"
            stage: Optional stage identifier (ActionType.DRAFT or ActionType.OPTIMIZE)
            now: Current time, if None uses current UTC time
            
        Returns:
            Sort key tuple for sorting
        """
        # Get original sort key
        original_key = self.sort_key(stage=stage)
        q_val, rma_val, sim_val, ts_val = original_key
        
        # Calculate time weighting
        if now is None:
            now = datetime.now(timezone.utc)
        recent_window = timedelta(days=recent_window_days)
        
        time_weight = 0.0
        
        # Calculate time decay weight
        if isinstance(self.created_at, datetime):
            days_old = (now - self.created_at).total_seconds() / 86400.0
            # Exponential decay: exp(-decay_factor * days_old)
            # Convert to sort key (negative value, because larger is better)
            time_weight = -math.exp(-decay_factor * days_old) * 0.1
        
        # Check if it's a recent successful experience
        is_recent_success = False
        if stage is not None:
            fields = self._get_q_fields(stage)
            q_updated_at = getattr(self, fields['q_updated_at'])
            last_reward = getattr(self, fields['last_reward'])
        else:
            q_updated_at = self.draft_q_updated_at
            last_reward = self.draft_last_reward
        
        if isinstance(self.created_at, datetime) or isinstance(q_updated_at, datetime):
            update_time = q_updated_at or self.created_at
            if isinstance(update_time, datetime):
                time_since_update = now - update_time
                if time_since_update <= recent_window:
                    # Check if last reward is positive (indicating success)
                    if last_reward is not None and last_reward > 0:
                        is_recent_success = True
        
        # If it's a recent success, add reward weight (negative value, because larger is better)
        recent_success_bonus = -recent_bonus if is_recent_success else 0.0
        
        # Return modified sort key: add time weight after timestamp
        # Format: (q_value, reward_ma, score, timestamp, time_weight, recent_success_bonus)
        return (q_val, rma_val, sim_val, ts_val, time_weight, recent_success_bonus)

    def __lt__(self, other: Any) -> bool:
        if not isinstance(other, BaseMemoryNote):
            return NotImplemented
        return self.sort_key() < other.sort_key()

    def __eq__(self, other: Any) -> bool:
        if not isinstance(other, BaseMemoryNote):
            return NotImplemented
        return self.sort_key() == other.sort_key()
    

    def __repr__(self,) -> str:
        return f"""
{self.__class__.__name__}(
    id={self.id}, 
    draft_q_value={self.draft_q_value}, 
    optimize_q_value={self.optimize_q_value}, 
    score={None if self.score is None else (round(float(self.score), 4) if math.isfinite(float(self.score)) else float(self.score))},
    draft_reward_ma={self.draft_reward_ma}, 
    optimize_reward_ma={self.optimize_reward_ma},
    memory={trim_long_string(self.memory, threshold=20, k=10)}, 
    last_accessed_at={self.last_accessed_at}, 
    retrieval_count={self.retrieval_count}
)"""

    def __str__(self,) -> str:
        return self.__repr__()



class APINote(BaseMemoryNote):
    """Represents an API-related memory note with structured metadata.

    Provides common fields used when storing API documentation, examples,
    and lightweight schemas in the memory system.
    """
    note_type: str = "api"
    memory: Optional[str] = Field(None, description="Short human-readable description")

    name: str = Field(..., description="API name or identifier (e.g. aclrtMemcpy)")
    category: Optional[str] = Field(default="General", description="High-level category")
    level: Optional[str] = Field(default="General", description="High-level category")
    io_spec: Optional[str] = Field(default="General", description="High-level category")
    parameters: Optional[List[Dict]] = Field(
        default=None,
        description="parameters"
    )
    return_value: Optional[str] = Field(None, description="return_value")
    prototypes: Optional[List[Dict]] = Field(
        default=None,
        description="List of function or method prototypes",
    )
    constraints: Optional[str] = Field(None, description="constraints")
    example: Optional[str] = Field(None, description="Short example usage snippet")

    @field_validator('name')
    @classmethod
    def _normalize_name(cls, v: str) -> str:
        return str(v).strip()
    
    def __str__(self,) -> str:
        return self.__repr__()
    
    def __repr__(self,) -> str:
        return f"""
{self.__class__.__name__}(
    id={self.id}, 
    draft_q_value={self.draft_q_value}, 
    optimize_q_value={self.optimize_q_value}, 
    score={None if self.score is None else (round(float(self.score), 4) if math.isfinite(float(self.score)) else float(self.score))},
    draft_reward_ma={self.draft_reward_ma}, 
    optimize_reward_ma={self.optimize_reward_ma},
    memory={trim_long_string(self.memory, threshold=20, k=10)}, 
    last_accessed_at={self.last_accessed_at}, 
    retrieval_count={self.retrieval_count}
)"""


class CodeExampleNote(BaseMemoryNote):
    """Store example or successful code snippets and minimal metadata.

    This note holds runnable example code, small test harnesses, or working
    kernel implementations. It is searchable and can be linked to APIs or
    operators via `related_apis`.
    """

    note_type: Literal["code-example"] = "code-example"

    memory: Optional[str] = Field(
        default=None,
        description="Key or prompt for retrieving this memory (e.g., op_name + shape + dtype)",
    )

    plan: Optional[str] = Field(
        default=None,
        description="",
    )

    code: str = Field(
        ...,
        description="Source code text",
    )

    reviews: Optional[List] = Field(
        default=[],
        description="List of memory note IDs corresponding to code reviews",
    )

    is_compilable: Optional[bool] = Field(
        default=None,
        description="Whether the code can be successfully compiled/passes build (None if unknown)",
    )
    is_correct: Optional[bool] = Field(
        default=None,
        description="Whether the code is semantically and functionally correct (None if unknown or unverified)",
    )
    optimized_degree_to_parent: Optional[float] = Field(
        default=None,
        description="Optimization degree of code relative to its parent code example, larger means more optimization",
    )

    optimized_degree_to_best: Optional[float] = Field(
        default=None,
        description="Optimization degree of code relative to its best child code example, larger means more optimization",
    )

    optimized_degree_to_root: Optional[float] = Field(
        default=None,
        description="Optimization degree of code relative to its root code example, larger means more optimization",
    )

    stage: Optional[ActionType] = Field(
        default=None,
        description="Development stage of the code (e.g., 'draft', 'optimize')",
    )

    parent: Optional[str] = Field(
        default=None,
        description="ID of the parent code example (if any)",
    )

    children: Optional[List[str]] = Field(
        default=[],
        description="List of IDs of other code examples derived from this code example",
    )
    
    arc_src: Optional[str] = Field(
        default=None,
        description="ARC description or source information related to this code example (optional)",
    )

    performance: Optional[Dict[str, Any]] = Field(
        default=None,
        description="Performance-related metrics (optional), e.g., {'latency_ms': float, 'throughput': float}",
    )

    op_name: Optional[str] = Field(
        default=None,
        description="Associated operator/OP name (optional, for aggregating example code by operator)",
    )
    def sort_key_score_performance(self) -> Tuple[Any, ...]:
        """
        code-example is more sensitive to similarity, so score has higher sort priority
        Sort priority (from high to low):
        1) score (similarity, larger is better)
        2) optimized_degree_to_root (larger is better)
        3) created_at (time: newer is better)
        """
        
        if self.optimized_degree_to_root is not None and math.isfinite(self.optimized_degree_to_root):
            optimized_degree_to_root = round(float(self.optimized_degree_to_root), 4)
        else:
            optimized_degree_to_root = float("-inf")
        
        if self.created_at is not None and isinstance(self.created_at, datetime):
            created_at = self.created_at.timestamp()
        else:
            created_at = datetime(1970, 1, 1, tzinfo=timezone.utc).timestamp()
        
        return (self.score, optimized_degree_to_root, created_at)
        
    def __str__(self,) -> str:
        return self.__repr__()
    
    def __repr__(self,) -> str:
        return f"""
{self.__class__.__name__}(
    id={self.id}, 
    op_name={self.op_name},
    draft_q_value={self.draft_q_value},
    optimize_q_value={self.optimize_q_value}, 
    score={None if self.score is None else (round(float(self.score), 4) if math.isfinite(float(self.score)) else float(self.score))},
    draft_reward_ma={self.draft_reward_ma},
    optimize_reward_ma={self.optimize_reward_ma},
    last_reward={self.last_reward},
    reviews={self.reviews},
    memory={trim_long_string(self.memory, threshold=20, k=10)}, 
    last_accessed_at={self.last_accessed_at}, 
    retrieval_count={self.retrieval_count}, 
    q_updated_at={self.q_updated_at},
    stage={self.stage},
    optimized_degree_to_parent={self.optimized_degree_to_parent},
    optimized_degree_to_root={self.optimized_degree_to_root},
    optimized_degree_to_best={self.optimized_degree_to_best},
)"""

    def sort_key(self, stage: Optional[Union[str, Any]] = None) -> Tuple[Any, ...]:
        """
        code-example is more sensitive to similarity, so score has higher sort priority
        Sort priority (from high to low):
        1) score (similarity, larger is better)
        2) q_value (larger is better)
        3) reward_ma (larger is better)
        4) created_at (time: newer is better)

        Args:
            stage: Optional stage identifier ('draft' or 'optimize'). If None, defaults to 'draft'
        """

        if stage is not None:
            # Use stage-specific Q values
            fields = self._get_q_fields(stage)
            q = getattr(self, fields['q_value'])
            rma = getattr(self, fields['reward_ma'])
        else:
            # Default to draft Q values for backward compatibility
            q = self.draft_q_value
            rma = self.draft_reward_ma
        
        if q is None or not math.isfinite(q):
            q = float("0.0")

        if rma is None or not math.isfinite(rma):
            rma = float("0.0")

        sim = self.score
        if sim is None or not math.isfinite(sim):
            sim = float("-inf")
        else:
            sim = round(float(sim), 4) if math.isfinite(sim) else float(sim)
        
        try:
            created_at_value = getattr(self, 'created_at', None)
            if isinstance(created_at_value, datetime):
                ts = created_at_value.timestamp()
            else:
                ts = datetime(1970, 1, 1, tzinfo=timezone.utc).timestamp()

        except (AttributeError, TypeError):
            ts = datetime(1970, 1, 1, tzinfo=timezone.utc).timestamp()
            logger.info(f"created_at access error, use default timestamp: {ts}")
        
        return (sim, q, rma, ts)
    

class ExperienceNote(BaseMemoryNote):
    """Represents development experiences including debugging, optimization, and implementation notes.
    
    This note type captures valuable learning experiences from the development process,
    making them searchable and reusable for future similar tasks.
    """
    note_type: str = "experience"
    memory: Optional[str] = Field(None, description="Detailed description of the experience and learnings")
    experience_type: Optional[ExperienceType] = Field(None, description="Type of experience: General, Operator-Specific")
    stage: Optional[ActionType] = Field(
        default=None,
        description="Development stage of the experience (e.g., DRAFT, OPTIMIZE)",
    )   
    op_name: Optional[str] = Field(
        default=None,
        description="Associated operator/OP name (for aggregating experiences by operator)",
    )
    source: Optional[ExperienceSource] = Field(
        default=None,
        description="Source: summary of successful implementation, review of failed implementation",
    )
    content: Optional[str] = Field(
        default=None,
        description="Experience content",
    )
    abstract: Optional[str] = Field(
        default=None,
        description="Experience abstract",
    )

    @field_validator('experience_type')
    @classmethod
    def _validate_experience_type(cls, v: ExperienceType) -> ExperienceType:
        valid_types = [ExperienceType.General, ExperienceType.OperatorSpecific]
        if v not in valid_types:
            raise ValueError(f"experience_type must be one of {valid_types}, got '{v}'")
        return v
    
    def __str__(self,) -> str:
        return self.__repr__()
    
    def __repr__(self,) -> str:
        return f"""
{self.__class__.__name__}(
    id={self.id}, 
    op_name={self.op_name},
    draft_q_value={self.draft_q_value}, 
    optimize_q_value={self.optimize_q_value}, 
    score={None if self.score is None else (round(float(self.score), 4) if math.isfinite(float(self.score)) else float(self.score))},
    draft_reward_ma={self.draft_reward_ma}, 
    optimize_reward_ma={self.optimize_reward_ma},
    memory={trim_long_string(self.memory, threshold=20, k=10)}, 
    last_accessed_at={self.last_accessed_at}, 
    retrieval_count={self.retrieval_count},
    stage={self.stage},
)"""
