#!/usr/bin/env python3
"""
LLMGenerator: Use an LLM to generate geometry problems
"""

import json
import os
import re
import time
from typing import Any, Dict, Optional

from openai import OpenAI

from ..utils.symbol_translator import SymbolTranslator
from ..utils import latex_to_float


class LLMGenerator:
    """A generator that uses an LLM to create geometry problems."""
    
    def __init__(
        self,
        api_key: Optional[str] = None,
        model: Optional[str] = None,
        base_url: Optional[str] = None,
        max_retries: int = 3,
    ):
        """
        Initialize the generator.
        
        Args:
            api_key: API key (if None, read from environment variables)
            model: Model name (if None, use the default)
            base_url: API base URL (if None, use the default)
            max_retries: Maximum number of retries
        """
        # Set defaults
        if model is None:
            model = os.getenv("OPENAI_MODEL") or "gpt-4o-mini"
        if base_url is None:
            base_url = os.getenv("OPENAI_BASE_URL") or "https://api.openai.com/v1"
        
        self.api_key = api_key or os.getenv("OPENAI_API_KEY")
        
        if not self.api_key:
            raise ValueError("An API key is required (via argument or environment variable).")
        
        self.model = model
        self.base_url = base_url
        self.max_retries = max_retries
        client_kwargs = {"api_key": self.api_key, "timeout": 600.0}
        if self.base_url:
            client_kwargs["base_url"] = self.base_url
        self.client = OpenAI(**client_kwargs)
        self.translator = SymbolTranslator()
    
    @staticmethod
    def extract_problem_and_proof_old(data: Dict[str, Any]) -> tuple[str, str, str, str]:
        """Extract problem, conclusion, original_constructions and aux from the legacy format."""
        llm_input = data.get("llm_input_renamed", "")
        llm_output = data.get("llm_output_renamed", "")
        # Extract <problem>...</problem>
        problem_match = re.search(r'<problem>(.*?)</problem>', llm_input, re.DOTALL)
        problem = problem_match.group(1).strip() if problem_match else ""
        
        # Extract conclusion (goal): take the part after "?" from the problem string
        conclusion = ""
        if "?" in problem:
            conclusion = problem.split("?")[-1].strip()
            # Remove the conclusion part from problem; keep only the premises
            problem = problem.split("?")[0].strip()
        
        # Extract <aux>...</aux>
        aux = ""
        aux_match = re.search(r'<aux>(.*?)</aux>', llm_output, re.DOTALL)
        if aux_match:
            aux = aux_match.group(1).strip()
        
        return problem, conclusion, aux
    
    @staticmethod
    def extract_problem_and_proof(data: Dict[str, Any]) -> tuple[str, str, str]:
        """Extract problem (premises), conclusion, and aux from the new data format.
        
        The input `data` looks like:
        {
            "prob": "<problem> a : ; ... ? eqangle ... </problem>",
            "aux": "x00 h : coll ... ;",
            "difficulty": 10.875,
            ...
        }
        """
        prob_raw = data.get("prob", "")  # The full segment including the <problem> tag
        
        # 1) Extract the inner content of <problem> ... </problem>
        m = re.search(r'<problem>(.*?)</problem>', prob_raw, re.DOTALL)
        inner = m.group(1).strip() if m else prob_raw.strip()
        
        # 2) Split premises (problem) and conclusion from the inner content
        problem = inner
        conclusion = ""
        if "?" in inner:
            # Split only at the first "?"
            before_q, after_q = inner.split("?", 1)
            problem = before_q.strip()        # keep only the premises before "?"
            conclusion = after_q.strip()      # everything after "?" is the conclusion
        
        # 3) aux comes directly from the field (already the content itself, without <aux> tags)
        aux = data.get("aux", "")
        if aux is None:
            aux = ""
        aux = aux.strip()
        #print(problem, conclusion, aux)
        return problem, conclusion, aux
        
    @staticmethod
    def format_prompt(problem: str, conclusion: str, aux: str = "", problem_type: str = "computation") -> str:
        """Format the prompt for the LLM.
        
        Args:
            problem: Geometry premises/conditions
            conclusion: Conclusion/goal
            aux: Auxiliary construction(s)
            problem_type: Problem type: "computation" or "proof" (default: "computation")
        """
        if problem_type == "proof":
            # Proof mode
            prompt = """
    You are a professional geometry problem writer, expert in Euclidean plane geometry and contest-style geometry (e.g., AMC / AIME / math olympiads).

    [Goal]

    Given an input <problem> (geometry premises) and <conclusion> (the statement to prove), you must:
    1. Understand the described geometric configuration (points, segments, perpendicularity, parallelism, equal lengths, similarity, collinearity, etc.).
    2. Convert the symbolic premises and conclusion into a natural-language geometry proof problem.
    3. Provide a complete problem statement and a detailed proof (CoT), then conclude the proof.

    The statement must be purely geometric (no coordinate geometry).

    --------------------------------
    [Requirements]

    1. **Statement construction**
    - Convert the premises in <problem> into natural language.
    - Convert the conclusion in <conclusion> into the goal to be proved.
    - You may add reasonable auxiliary conditions (e.g., midpoint, angle bisector, internal/external division), but they must be consistent with the geometry in <problem>.
    - **Do not introduce new unknowns or extra parameters** in the statement/proof (e.g., new variables \(x,y,t,k\)). If you need quantitative relations, express them using already-given quantities (lengths, angles, ratios) or their combinations.

    2. **Proof goal**
    - End the statement with "Prove that: ..." and clearly specify the conclusion.
    - The goal may be:
      - two segments are equal or proportional;
      - two angles are equal or have a ratio;
      - points are collinear or concyclic;
      - lines are parallel or perpendicular;
      - triangles are similar or congruent;
      - other valid geometric relations.

    3. **Geometric consistency**
    - The problem must be logically consistent, non-contradictory, and provable.
    - Avoid obvious degenerate cases (e.g., three collinear points claimed to form a triangle).
    - If you introduce new points (e.g., intersection, foot, midpoint), define them clearly.
    - The premises must be sufficient to imply the conclusion.

    4. **Statement format**
    - Natural English with LaTeX math notation (e.g., \(AB\), \(\angle ABC\), \(S_{\\triangle ABC}\)).
    - Do not include reasoning text such as "conclusion" in the statement; only include construction and the proof goal.
    - The last sentence must be "Prove that: ..."

    5. **CoT proof**
    - Write the full proof as Step1 / Step2 / Step3 ...
    - Use LaTeX symbols and formulas.
    - Each step must cite the theorem/property used (e.g., congruence, similarity, parallel line angle properties, circle theorems).
    - Do not mention DSL, <problem>, symbolic predicates, etc. Reason only from the statement.
    - The proof must be clear and complete.

    6. **Answer format**
    - "answer": For proof problems, the answer can be "QED" or omitted (the system will handle it).
    - The focus is on the correctness/completeness of "question" and "cot"; "answer" is optional.

    --------------------------------
    [Input]

    <problem> {problem} </problem>
    <conclusion> {conclusion} </conclusion>
    {aux_section}

    [Output]

    Output only ONE JSON object:

    {{
    "question": "(English statement using LaTeX, ending with 'Prove that: ...')",
    "cot": "Step1 ...\\nStep2 ...\\nStep3 ...",
    "answer": "QED"  // optional; can be empty or the fixed value "QED"
    }}
    """
        else:
            # Computation mode (original logic)
            prompt = """
    You are a professional geometry problem writer, expert in Euclidean plane geometry and contest-style geometry (e.g., AMC / AIME / math olympiads).

    [Goal]

    Based on the input <problem> (geometry premises) and conclusion, you must:
    1. Understand the described geometric configuration (points, segments, perpendicularity, parallelism, equal lengths, similarity, collinearity, etc.).
    2. Design a high-quality, challenging numerical geometry problem based on this configuration (with exactly ONE target quantity to solve).
    3. Provide a complete problem statement, detailed reasoning (CoT), and the final numerical answer.

    The statement must be purely geometric (no coordinate geometry).

    --------------------------------
    [Requirements]

    1. **Numeric settings**
    - Assign reasonable numeric values to lengths, angles, ratios, etc. (prefer integers or simple fractions in the range 2–20, e.g., \( \\frac{3}{2}, \\frac{5}{3} \)).
    - Avoid overly trivial answers (avoid obvious results like 0, 1, 2; avoid answers that are identical to a given quantity).
    - You may add reasonable auxiliary conditions (e.g., midpoint, angle bisector, division point), but they must be consistent with the geometry in <problem>.

    2. **Target type (choose exactly ONE)**
    The statement must end with "Find ..." and include only one target, such as:
    - a segment length;
    - an angle measure or a trigonometric value;
    - a ratio of two segments;
    - area/perimeter of a triangle or quadrilateral;
    - circle-related measures (angles, arc length, area, etc.);
    - arithmetic combinations of the above (e.g., \(AB^2 + AC^2\), area ratios).

    3. **Geometric consistency**
    - The problem must be logically consistent, non-contradictory, and have a unique solution.
    - Avoid degenerate cases (e.g., three collinear points claimed to form a triangle).
    - If you introduce new points (e.g., intersection, foot, midpoint), define them clearly.

    4. **Statement format**
    - Natural English with LaTeX math notation (e.g., \(AB\), \(\angle ABC\), \(S_{\\triangle ABC}\)).
    - Do not include reasoning text such as "conclusion" in the statement; only include construction.
    - The last sentence must end with "Find ..."

    5. **CoT reasoning**
    - Write as Step1 / Step2 / Step3 ...
    - Use LaTeX symbols and formulas.
    - Do not mention DSL, <problem>, symbolic predicates, etc. Reason only from the statement.

    6. **Answer format**
    - "answer": Provide only the final numeric value or expression, e.g., "\\frac{15}{2}", "5\\sqrt{3}".
    - Do not add any explanatory text.

    --------------------------------
    [Input]

    <problem> {problem} </problem>
    <conclusion> {conclusion} </conclusion>
    {aux_section}

    [Output]

    Output only ONE JSON object:

    {{
    "question": "(English statement using LaTeX)",
    "cot": "Step1 ...\\nStep2 ...\\nStep3 ...",
    "answer": "(Final numeric result only)"
    }}
    """

        aux_section = ""
        if aux and aux.strip():
            aux_section = f"<aux> {aux} </aux>\n"

        # Avoid .format consuming all braces {}: only replace our placeholders
        prompt = prompt.replace("{problem}", problem)
        prompt = prompt.replace("{conclusion}", conclusion)
        prompt = prompt.replace("{aux_section}", aux_section)

        return prompt



    def call_llm(self, prompt: str) -> Dict[str, Any]:
        """Call the LLM API."""
        #input()
        #print(self.max_retries)
        for attempt in range(self.max_retries):
            try:
                completion = self.client.chat.completions.create(
                    model=self.model,
                    messages=[
                        {
                            "role": "user",
                            "content": prompt,
                        },
                    ],
                    temperature=0.7,
                    max_tokens=32767 * 2,
                    reasoning_effort="high"
                )
                choice = completion.choices[0]
                response = choice.message
                finish_reason = getattr(choice, "finish_reason", None)
                
                if finish_reason == "length":
                    raise Exception(
                        "The LLM response was truncated (finish_reason=length). "
                        "Please increase max_tokens or shorten the prompt."
                    )
                return {
                    "content": response.content if response else "",
                    "usage": completion.usage,
                    "finish_reason": finish_reason,
                }
                
            except Exception as e:
                if attempt < self.max_retries - 1:
                    wait_time = 2 ** attempt
                    print(f"Attempt {attempt + 1} failed; retrying in {wait_time} seconds... ({e})")
                    time.sleep(wait_time)
                    continue
                raise Exception(f"API call failed (retried {self.max_retries} times): {e}")
        
        raise Exception("Reached maximum retry count.")
    
    @staticmethod
    def _serialize_usage(usage_obj) -> Optional[Dict[str, int]]:
        """
        Convert a usage object into a JSON-serializable dict.
        
        Args:
            usage_obj: usage object (may be a CompletionUsage object or a dict)
            
        Returns:
            A dict-form usage. Returns None if it cannot be converted.
        """
        if usage_obj is None:
            return None
        
        # If it's already a dict, return it directly
        if isinstance(usage_obj, dict):
            return {
                "prompt_tokens": usage_obj.get("prompt_tokens", 0) or 0,
                "completion_tokens": usage_obj.get("completion_tokens", 0) or 0,
                "total_tokens": usage_obj.get("total_tokens", 0) or 0,
            }
        
        # If it's an object, extract attributes
        try:
            prompt_tokens = getattr(usage_obj, 'prompt_tokens', None)
            completion_tokens = getattr(usage_obj, 'completion_tokens', None)
            total_tokens = getattr(usage_obj, 'total_tokens', None)
            
            # If attributes exist, convert to dict
            if prompt_tokens is not None or completion_tokens is not None or total_tokens is not None:
                return {
                    "prompt_tokens": int(prompt_tokens) if prompt_tokens is not None else 0,
                    "completion_tokens": int(completion_tokens) if completion_tokens is not None else 0,
                    "total_tokens": int(total_tokens) if total_tokens is not None else 0,
                }
        except Exception:
            pass
        
        return None
    
    @staticmethod
    def extract_json_from_response(response_text: str) -> Optional[Dict[str, Any]]:
        """Extract a JSON object from a model response text."""
        if not response_text:
            return None

        stripped = response_text.strip()

        # 1) Direct parse
        try:
            return json.loads(stripped)
        except json.JSONDecodeError:
            pass

        # 2) Parse a ```json ... ``` code block
        # Find the start of the JSON object inside the code block
        code_block_match = re.search(r"```(?:json)?\s*(\{)", response_text, re.DOTALL)
        if code_block_match:
            start_pos = code_block_match.start(1)  # JSON object start position
            json_text = response_text[start_pos:]
            
            # Find the end marker (if present)
            if "```" in json_text[1:]:  # Search from the 2nd char to avoid matching the opening fence
                end_marker = json_text.find("```", 1)
                if end_marker > 0:
                    json_text = json_text[:end_marker].rstrip()
            
            # Try parsing first
            decoder = json.JSONDecoder()
            try:
                obj, end_pos = decoder.raw_decode(json_text)
                if isinstance(obj, dict):
                    return obj
            except json.JSONDecodeError:
                # If parsing fails, string values may contain unescaped control characters or backslashes.
                # Fix by escaping unescaped control characters and backslashes inside string values.
                def fix_string_value(match):
                    key_part = match.group(1)  # "key":
                    value = match.group(2)     # Raw value content
                    tail = match.group(3)      # Closing quote

                    fixed_value = value
                    # 1) newline/tab/carriage return -> escaped
                    fixed_value = re.sub(r'(?<!\\)\n', r'\\n', fixed_value)
                    fixed_value = re.sub(r'(?<!\\)\t', r'\\t', fixed_value)
                    fixed_value = re.sub(r'(?<!\\)\r', r'\\r', fixed_value)
                    # 2) backslash + letter -> double backslash (to protect LaTeX)
                    fixed_value = re.sub(r'(?<!\\)\\(?=[a-zA-Z])', r'\\\\', fixed_value)
                    # 3) unescaped double quote -> \"
                    fixed_value = re.sub(r'(?<!\\)"', r'\\"', fixed_value)

                    return key_part + fixed_value + tail

                try:
                    # Match all string values and fix them
                    fixed_json = re.sub(
                        r'("(?:question|cot|answer)"\s*:\s*")(.*?)(")',
                        fix_string_value,
                        json_text,
                        flags=re.DOTALL
                    )
                    # Try parsing again
                    obj, _ = decoder.raw_decode(fixed_json)
                    if isinstance(obj, dict):
                        return obj
                except (json.JSONDecodeError, Exception):
                    pass

        # 3) Parse the first "{ ... }" substring (try to find a valid JSON object)
        decoder = json.JSONDecoder()
        for idx, ch in enumerate(response_text):
            if ch != "{":
                continue
            try:
                obj, _ = decoder.raw_decode(response_text[idx:])
                if isinstance(obj, dict):
                    return obj
            
            except json.JSONDecodeError:
                    continue

        return None
    
    def generate(self, row_data: Dict[str, Any], index: Optional[int] = None, problem_type: Optional[str] = None) -> Dict[str, Any]:
        """
        Generate one problem.
        
        Args:
            row_data: Input data
            index: Optional index (for logging)
            problem_type: "computation" or "proof". If None, read from row_data; default is "computation".
        
        Returns:
            A result dict containing:
            - success: bool
            - generated: generated JSON (if success)
            - llm_response: raw LLM response
            - error: error message (if failed)
        """
        # Determine problem type: prefer argument, then row_data, then default to proof
        if problem_type is None:
            problem_type = row_data.get("problem_type", "proof")
        problem_type = problem_type.lower()
        if problem_type not in ["computation", "proof"]:
            problem_type = "proof"  # default
        # Use the same retry count as call_llm
        for attempt in range(self.max_retries):
            try:
                # Extract problem, conclusion, and aux
                problem, conclusion, aux = self.extract_problem_and_proof(row_data)
                
                if not problem:
                    return {
                        "success": False,
                        "error": "Failed to extract problem.",
                    }
                
                # Translate the symbolic language into natural language
                # First try translate_problem_origin for the problem_origin format
                # If problem looks like problem_origin format (contains patterns like "a :"), use translate_problem_origin
                if re.search(r'\w+\s*:\s*', problem):
                    problem_nl = self.translator.translate_problem_origin(problem)
                    if not problem_nl:
                        # If translation fails, try translate_problem
                        problem_nl = self.translator.translate_problem(problem, simplify=True)
                        if not problem_nl:
                            problem_nl = problem
                            if index is not None:
                                print(f"[Sample {index}] Failed to translate problem; using original problem.")
                else:
                    # Otherwise use translate_problem
                    problem_nl = self.translator.translate_problem(problem, simplify=True)
                    if not problem_nl:
                        # If translation fails, use original problem
                        problem_nl = problem
                        if index is not None:
                            print(f"[Sample {index}] Failed to translate problem; using original problem.")
                
                # Translate conclusion
                conclusion_nl = ""
                if conclusion:
                    # conclusion may be a simple predicate (e.g., "coll a b c") or a full proof format
                    # First try parsing as a simple predicate
                    conclusion_stripped = conclusion.strip()
                    # Match a simple predicate format: predicate arg1 arg2 ...
                    predicate_match = re.match(r'^(\w+)\s+(.+)$', conclusion_stripped)
                    if predicate_match:
                        pred_name = predicate_match.group(1)
                        args_str = predicate_match.group(2).strip()
                        args = [a.strip() for a in args_str.split() if a.strip()]
                        # Try translating the predicate directly
                        translation = self.translator.translate_predicate(pred_name, args)
                        if translation:
                            conclusion_nl = translation
                        else:
                            # If direct translation fails, try translating as proof format
                            conclusion_nl = self.translator.translate_proof(conclusion, simplify=True)
                            if not conclusion_nl:
                                conclusion_nl = conclusion
                                if index is not None:
                                    print(f"[Sample {index}] Failed to translate conclusion; using original conclusion: {conclusion}")
                    else:
                        # If it doesn't match the simple predicate format, translate as proof format
                        conclusion_nl = self.translator.translate_proof(conclusion, simplify=True)
                        if not conclusion_nl:
                            conclusion_nl = conclusion
                            if index is not None:
                                print(f"[Sample {index}] Failed to translate conclusion; using original conclusion: {conclusion}")
                
                # Translate aux (if present)
                aux_nl = ""
                if aux:
                    # aux is similar to problem; use translate_problem_origin or translate_problem
                    if re.search(r'\w+\s*:\s*', aux):
                        aux_nl = self.translator.translate_problem_origin(aux)
                        if not aux_nl:
                            aux_nl = self.translator.translate_problem(aux.replace('?', ''), simplify=True)
                            if not aux_nl:
                                aux_nl = aux
                    else:
                        aux_nl = self.translator.translate_problem(aux.replace('?', ''), simplify=True)
                        if not aux_nl:
                            aux_nl = aux
                
                # Log translated/original snippets for debugging and auditing
                prompt_payload = {
                    "problem_translated": problem_nl,
                    "problem_original": problem,
                    "conclusion_translated": conclusion_nl,
                    "conclusion_original": conclusion,
                    "aux_translated": aux_nl if aux else None,
                    "aux_original": aux if aux else None,
                }
                #print(prompt_payload)

                # Format prompt using translated natural language
                prompt = self.format_prompt(problem_nl, conclusion_nl, aux_nl, problem_type=problem_type)
                #print(prompt)
                # Call LLM
                import time as time_module
                if index is not None:
                    print(f"[Sample {index}] Calling API to generate a problem...")
                call_start_time = time_module.time()
                api_response = self.call_llm(prompt)
                call_elapsed_time = time_module.time() - call_start_time
                
                llm_response = api_response.get("content", "")
                finish_reason = api_response.get("finish_reason")
                usage = api_response.get("usage")
                
                # Record call details
                call_details = {
                    "timestamp": time_module.time(),
                    "elapsed_time": call_elapsed_time,
                    "response_length": len(llm_response) if llm_response else 0,
                    "finish_reason": finish_reason,
                    "usage": self._serialize_usage(usage) if usage else None,
                }
                
                if index is not None:
                    print(
                        f"[Sample {index}] API call elapsed: {call_elapsed_time:.2f}s, "
                        f"response length: {len(llm_response) if llm_response else 0}, "
                        f"finish_reason: {finish_reason}"
                    )
                
                # Extract JSON
                result_json = self.extract_json_from_response(llm_response)
                
                if result_json:
                    # Validate required fields
                    # For proof problems, the answer field is optional; fill it automatically if missing
                    if problem_type == "proof" and "answer" not in result_json:
                        result_json["answer"] = "QED"
                    
                    if "question" in result_json and ("answer" in result_json or problem_type == "proof"):
                        # For computation problems, check whether the answer can be parsed as a number
                        # For proof problems, the answer can be text (e.g., "QED"), no numeric validation needed
                        if problem_type == "computation":
                            answer_value = latex_to_float(result_json.get("answer"))
                            if answer_value is None:
                                # Answer cannot be parsed as a number -> retry
                                if attempt < self.max_retries - 1:
                                    wait_time = 2 ** attempt
                                    answer_str = result_json.get("answer", "")
                                    print(f"[Sample {index}] Attempt {attempt + 1}/{self.max_retries} failed: answer is not parseable as a number (answer: {answer_str[:50]}...), retrying in {wait_time} seconds...")
                                    time.sleep(wait_time)
                                    continue
                                return {
                                    "success": False,
                                    "error": f"Answer is not parseable as a number: {result_json.get('answer', '')}",
                                    "llm_response": llm_response,
                                    "prompt_payload": prompt_payload,
                                    "prompt_text": prompt,
                                    "usage": usage,
                                    "finish_reason": finish_reason,
                                    "call_details": call_details,
                                }
                            
                            # Answer is parseable -> success
                            if index is not None:
                                print(f"[Sample {index}] Successfully generated a problem; parsed answer: {answer_value}")
                        else:
                            # Proof problem: answer may be text; no numeric validation
                            answer_str = result_json.get("answer", "")
                            if index is not None:
                                print(f"[Sample {index}] Successfully generated a proof problem; answer: {answer_str[:100]}...")
                        return {
                            "success": True,
                            "generated": result_json,
                            "llm_response": llm_response,
                            "prompt_payload": prompt_payload,
                            "prompt_text": prompt,
                            "usage": usage,
                            "finish_reason": finish_reason,
                            "call_details": call_details,
                        }
                    else:
                        # Check missing fields
                        missing_fields = []
                        if "question" not in result_json:
                            missing_fields.append("question")
                        if problem_type == "computation" and "answer" not in result_json:
                            missing_fields.append("answer")
                        
                        if missing_fields:
                            # If this is not the last attempt, retry; otherwise return error
                            if attempt < self.max_retries - 1:
                                wait_time = 2 ** attempt
                                print(f"[Sample {index}] Attempt {attempt + 1}/{self.max_retries} failed: generated JSON is missing required fields: {missing_fields}. Retrying in {wait_time} seconds...")
                                time.sleep(wait_time)
                                continue
                            return {
                                "success": False,
                                "error": f"Generated JSON is missing required fields: {missing_fields}",
                                "llm_response": llm_response,
                                "prompt_payload": prompt_payload,
                                "prompt_text": prompt,
                                "usage": usage,
                                "finish_reason": finish_reason,
                                "call_details": call_details,
                            }
                        else:
                            # In theory we shouldn't reach here (if question exists and it's a proof problem,
                            # it should have been handled above). For safety, if question exists for a proof
                            # problem, fill answer and proceed.
                            if problem_type == "proof" and "question" in result_json:
                                if "answer" not in result_json:
                                    result_json["answer"] = "QED"
                                # Re-enter success handling
                                answer_str = result_json.get("answer", "")
                                if index is not None:
                                    print(f"[Sample {index}] Successfully generated a proof problem; answer: {answer_str[:100]}...")
                                return {
                                    "success": True,
                                    "generated": result_json,
                                    "llm_response": llm_response,
                                    "prompt_payload": prompt_payload,
                                    "prompt_text": prompt,
                                    "usage": usage,
                                    "finish_reason": finish_reason,
                                    "call_details": call_details,
                                }
                else:
                    error_msg = "Failed to extract JSON from the response."
                    if llm_response:
                        error_msg += f" (response length: {len(llm_response)}, first 100 chars: {llm_response[:100]})"
                    # If not the last attempt, retry; otherwise return error
                    if attempt < self.max_retries - 1:
                        wait_time = 2 ** attempt
                        print(f"[Sample {index}] Attempt {attempt + 1}/{self.max_retries} failed: {error_msg} Retrying in {wait_time} seconds...")
                        time.sleep(wait_time)
                        continue
                    return {
                        "success": False,
                        "error": error_msg,
                        "llm_response": llm_response,
                        "finish_reason": finish_reason,
                        "prompt_payload": prompt_payload,
                        "prompt_text": prompt,
                        "usage": usage,
                        "call_details": call_details,
                    }
            
            except Exception as e:
                if index is not None:
                    print(f"[Sample {index}] Processing failed: {e}")
                # If not the last attempt, retry; otherwise return error
                if attempt < self.max_retries - 1:
                    wait_time = 2 ** attempt
                    print(f"[Sample {index}] Attempt {attempt + 1}/{self.max_retries} failed; retrying in {wait_time} seconds...")
                    time.sleep(wait_time)
                    continue
                return {
                    "success": False,
                    "error": str(e),
                }

