#!/usr/bin/env python3
"""
Prompts for codebook generation and other LLM tasks.

This module contains all prompts used throughout the schema induction pipeline,
including prompts for different code generation strategies.
"""

# Original prompts from prompts.json
CODEBOOK_GENERATION_PROMPT = """{FEWSHOT} 

 Task
Read the supplied document in full.

Goal
Return exactly 30 tags that capture the document at three abstraction tiers:

low‑level (10 tags) –  Sentence or snippet level key information. Highly local, micro, and specific. But should still be descriptive, not directly extractive.

mid‑level (10 tags) –  The gist of multi-sentence or paragraph. Moderately local, more abstract than low-level.

high‑level (10 tags) – Passage level, global level themes, tags, or patterns.  Higher semantic hierarchy, broader sense that frame the document in a wider context. More general, broad, and macro.

Tag requirements

Semantic + Pragmatic balance: Capture what the text is about (topics, entities, facts) and how it operates (high-level logic and pattern, language or narrative style, structural organization, intended audience, functionality, purpose, communicative intent, rhetorical strategies, property of the text).

Concise and self-explanatory – each tag should be between 5 and 15 words. The purpose is to reduce ambiguity: longer codes tend to be more precise, while overly short ones can be vague. If a code is ambiguous or unclear, expand it into a more descriptive 5–15 word phrase. If a code is already clear, keep it but ensure it falls within 5–15 words. Avoid redundancy while maintaining nuance. The goal is for each code to be self-explanatory and unambiguous without extra context.

Descending granularity – low‑level tags must be the most specific; high‑level the most general. However, tags should still be descriptive, reusable, generalizable, not purely extractive. Try your best to minimize vagueness and ambiguity.

Unique – no tag should appear in more than one tier.

Use standard English, use normal spacing, do not use Camel case. Do not add hashtag.

Output format (JSON only)

{
"low-level": ["...", "...", "..."],
"mid-level": ["...", "...", "..."],
"high-level": ["...", "...", "..."]
}
Do not add any other keys, text, or commentary."""

# Strategy 1: Direct code generation (30 codes across 3 levels)
STRATEGY_1_DIRECT_PROMPT = """Given the question: {QUESTION}, generate exactly 20 unique open codes that capture the document's meaning. Perform open coding — focus on abstraction and conceptualization, not detail or surface description. Each code should summarize meaning concisely, avoid micro-level detail, and reflect higher-level interpretive insight. Codes must be between 5 and 15 words, self-explanatory, unambiguous, and unique. Do not repeat or overlap concepts. Return the 20 codes as a JSON list only, with no additional text or commentary.

Text chunk:"""

# Shorter prompt for faster generation
STRATEGY_1_SHORT_PROMPT = """Given the question: {QUESTION}, generate 30 tags for this text chunk at 3 levels:

low-level (10): Sentence-level specific info
mid-level (10): Paragraph-level themes  
high-level (10): Passage-level patterns

Requirements: 5-15 words per tag, descriptive not extractive, unique across levels, self-explanatory without extra context.

Output JSON only:
{{"low-level": ["tag1", "tag2", ...], "mid-level": ["tag1", "tag2", ...], "high-level": ["tag1", "tag2", ...]}}

Text chunk:
"""

# Optimized prompts for KV cache efficiency
# Common prefix that can be cached across all requests
STRATEGY_1_COMMON_PREFIX = """Given the question: {QUESTION}, generate codebooks with respect to the question point of view.

Task
Read the supplied document in full.

Goal
Return exactly 30 tags that capture the document at three abstraction tiers:

low‑level (10 tags) –  Sentence or snippet level key information. Highly local, micro, and specific. But should still be descriptive, not directly extractive.

mid‑level (10 tags) –  The gist of multi-sentence or paragraph. Moderately local, more abstract than low-level.

high‑level (10 tags) – Passage level, global level themes, tags, or patterns.  Higher semantic hierarchy, broader sense that frame the document in a wider context. More general, broad, and macro.

Tag requirements

Semantic + Pragmatic balance: Capture what the text is about (topics, entities, facts) and how it operates (high-level logic and pattern, language or narrative style, structural organization, intended audience, functionality, purpose, communicative intent, rhetorical strategies, property of the text).

Concise and self-explanatory – each tag should be between 5 and 15 words. The purpose is to reduce ambiguity: longer codes tend to be more precise, while overly short ones can be vague. If a code is ambiguous or unclear, expand it into a more descriptive 5–15 word phrase. If a code is already clear, keep it but ensure it falls within 5–15 words. Avoid redundancy while maintaining nuance. The goal is for each code to be self-explanatory and unambiguous without extra context.

Descending granularity – low‑level tags must be the most specific; high‑level the most general. However, tags should still be descriptive, reusable, generalizable, not purely extractive. Try your best to minimize vagueness and ambiguity.

Unique – no tag should appear in more than one tier.

Use standard English, use normal spacing, do not use Camel case. Do not add hashtag.

Output format (JSON only)

{
"low-level": ["...", "...", "..."],
"mid-level": ["...", "...", "..."],
"high-level": ["...", "...", "..."]
}
Do not add any other keys, text, or commentary.

Text chunk:
"""

# Strategy 2 Hierarchical Prompts
STRATEGY_2_LOW_LEVEL_PROMPT = """Question: {question}

Generate exactly 5 low-level codes for the following text chunk with respect to the question asked.

Low-level codes are: Sentence or snippet level key information. Highly local, micro, and specific. But should still be descriptive, not directly extractive.

Tag requirements:
Semantic + Pragmatic balance: Capture what the text is about (topics, entities, facts) and how it operates (high-level logic and pattern, language or narrative style, structural organization, intended audience, functionality, purpose, communicative intent, rhetorical strategies, property of the text).

Informative & concise – each tag ≤ 5 words, no redundancy, no punctuation except hyphens. For the linguistic style, you will try to make tags a compact noun phrases or compound keywords (Twitter style). You will try to optimize the reusability and generalizability of the tags.

Descending granularity – low‑level tags must be the most specific; high‑level the most general. However, tags should still be descriptive, reusable, generalizable, not purely extractive. Try your best to minimize vagueness and ambiguity.

Unique – no tag should appear in more than one tier.

Use standard English, use normal spacing, do not use Camel case. Do not add hashtag.

Text chunk:
{chunk_text}

Respond with JSON ONLY in this exact format:
{{"low-level": ["code1", "code2", "code3", "code4", "code5"]}}

IMPORTANT: Respond with JSON ONLY. Do not include explanations, prose, or code fences."""

STRATEGY_2_MEDIUM_LEVEL_PROMPT = """Question: {question}

Generate exactly 1 medium-level code that represents the following cluster of low-level codes with respect to the question asked.

Medium-level codes are: The gist of multi-sentence or paragraph. Moderately local, more abstract than low-level.

Tag requirements:
Semantic + Pragmatic balance: Capture what the text is about (topics, entities, facts) and how it operates (high-level logic and pattern, language or narrative style, structural organization, intended audience, functionality, purpose, communicative intent, rhetorical strategies, property of the text).

Informative & concise – each tag ≤ 5 words, no redundancy, no punctuation except hyphens. For the linguistic style, you will try to make tags a compact noun phrases or compound keywords (Twitter style). You will try to optimize the reusability and generalizability of the tags.

Descending granularity – mid‑level tags must be more abstract than low-level but more specific than high-level. However, tags should still be descriptive, reusable, generalizable, not purely extractive. Try your best to minimize vagueness and ambiguity.

Unique – no tag should appear in more than one tier.

Use standard English, use normal spacing, do not use Camel case. Do not add hashtag.

Low-level codes in this cluster:
{cluster_codes}

Respond with JSON ONLY in this exact format:
{{"mid-level": ["code1"]}}

IMPORTANT: Respond with JSON ONLY. Do not include explanations, prose, or code fences."""

STRATEGY_2_HIGH_LEVEL_PROMPT = """Question: {question}

Generate exactly 1 high-level code that represents the following cluster of medium-level codes with respect to the question asked.

High-level codes are: Passage level, global level themes, tags, or patterns. Higher semantic hierarchy, broader sense that frame the document in a wider context. More general, broad, and macro.

Tag requirements:
Semantic + Pragmatic balance: Capture what the text is about (topics, entities, facts) and how it operates (high-level logic and pattern, language or narrative style, structural organization, intended audience, functionality, purpose, communicative intent, rhetorical strategies, property of the text).

Informative & concise – each tag ≤ 5 words, no redundancy, no punctuation except hyphens. For the linguistic style, you will try to make tags a compact noun phrases or compound keywords (Twitter style). You will try to optimize the reusability and generalizability of the tags.

Descending granularity – high‑level tags must be the most general and abstract. However, tags should still be descriptive, reusable, generalizable, not purely extractive. Try your best to minimize vagueness and ambiguity.

Unique – no tag should appear in more than one tier.

Use standard English, use normal spacing, do not use Camel case. Do not add hashtag.

Medium-level codes in this cluster:
{cluster_codes}

Respond with JSON ONLY in this exact format:
{{"high-level": ["code1"]}}

IMPORTANT: 
- Respond with JSON ONLY. Do not include explanations, prose, or code fences.
- Do NOT use <think> tags or any thinking mode.
- Do NOT include any analysis or step-by-step reasoning.
- Start your response directly with the JSON object."""

# Optimized prompts for KV cache efficiency
# Common prefix that can be cached across all requests
STRATEGY_2_LOW_LEVEL_COMMON_PREFIX = """Question: {question}

Generate exactly 5 low-level codes for the following text chunk with respect to the question asked.

Low-level codes are: Sentence or snippet level key information. Highly local, micro, and specific. But should still be descriptive, not directly extractive.

Tag requirements:
Semantic + Pragmatic balance: Capture what the text is about (topics, entities, facts) and how it operates (high-level logic and pattern, language or narrative style, structural organization, intended audience, functionality, purpose, communicative intent, rhetorical strategies, property of the text).

Informative & concise – each tag ≤ 5 words, no redundancy, no punctuation except hyphens. For the linguistic style, you will try to make tags a compact noun phrases or compound keywords (Twitter style). You will try to optimize the reusability and generalizability of the tags.

Descending granularity – low‑level tags must be the most specific; high‑level the most general. However, tags should still be descriptive, reusable, generalizable, not purely extractive. Try your best to minimize vagueness and ambiguity.

Unique – no tag should appear in more than one tier.

Use standard English, use normal spacing, do not use Camel case. Do not add hashtag.

Text chunk:
"""

STRATEGY_2_MEDIUM_LEVEL_COMMON_PREFIX = """Question: {question}

Generate exactly 1 medium-level code that represents the following cluster of low-level codes with respect to the question asked.

Medium-level codes are: The gist of multi-sentence or paragraph. Moderately local, more abstract than low-level.

Tag requirements:
Semantic + Pragmatic balance: Capture what the text is about (topics, entities, facts) and how it operates (high-level logic and pattern, language or narrative style, structural organization, intended audience, functionality, purpose, communicative intent, rhetorical strategies, property of the text).

Informative & concise – each tag ≤ 5 words, no redundancy, no punctuation except hyphens. For the linguistic style, you will try to make tags a compact noun phrases or compound keywords (Twitter style). You will try to optimize the reusability and generalizability of the tags.

Descending granularity – mid‑level tags must be more abstract than low-level but more specific than high-level. However, tags should still be descriptive, reusable, generalizable, not purely extractive. Try your best to minimize vagueness and ambiguity.

Unique – no tag should appear in more than one tier.

Use standard English, use normal spacing, do not use Camel case. Do not add hashtag.

Low-level codes in this cluster:
"""

STRATEGY_2_HIGH_LEVEL_COMMON_PREFIX = """Question: {question}

Generate exactly 1 high-level code that represents the following cluster of medium-level codes with respect to the question asked.

High-level codes are: Passage level, global level themes, tags, or patterns. Higher semantic hierarchy, broader sense that frame the document in a wider context. More general, broad, and macro.

Tag requirements:
Semantic + Pragmatic balance: Capture what the text is about (topics, entities, facts) and how it operates (high-level logic and pattern, language or narrative style, structural organization, intended audience, functionality, purpose, communicative intent, rhetorical strategies, property of the text).

Informative & concise – each tag ≤ 5 words, no redundancy, no punctuation except hyphens. For the linguistic style, you will try to make tags a compact noun phrases or compound keywords (Twitter style). You will try to optimize the reusability and generalizability of the tags.

Descending granularity – high‑level tags must be the most general and abstract. However, tags should still be descriptive, reusable, generalizable, not purely extractive. Try your best to minimize vagueness and ambiguity.

Unique – no tag should appear in more than one tier.

Use standard English, use normal spacing, do not use Camel case. Do not add hashtag.

Medium-level codes in this cluster:
"""

# JSON suffix for retry attempts
STRICT_JSON_SUFFIX = (
    "\n\nIMPORTANT: Respond with JSON ONLY. Do not include explanations, prose, or code fences. "
    'Return exactly this schema: {"low-level": [...], "mid-level": [...], "high-level": [...]}'
)

# Function to get prompts by name (for backward compatibility)
def get_prompt(prompt_name: str) -> str:
    """Get a prompt by name for backward compatibility with prompts.json"""
    prompts = {
        "codebook_generation": CODEBOOK_GENERATION_PROMPT,
        "strategy_1_direct": STRATEGY_1_DIRECT_PROMPT,
        "strategy_2_low_level": STRATEGY_2_LOW_LEVEL_PROMPT,
        "strategy_2_medium_level": STRATEGY_2_MEDIUM_LEVEL_PROMPT,
        "strategy_2_high_level": STRATEGY_2_HIGH_LEVEL_PROMPT,
    }
    return prompts.get(prompt_name, "")

# Function to fill template with variables
def fill_template(template: str, mapping: dict) -> str:
    """Fill a template string with variables from a mapping dictionary"""
    out = template
    for k, v in mapping.items():
        out = out.replace("{" + k + "}", str(v))
    return out 

# Optimized short prompts for better performance
STRATEGY_1_SHORT_PROMPT = """Question: {QUESTION}

Generate 30 tags for this text chunk at 3 levels:
- 10 low-level: specific, sentence-level info
- 10 mid-level: paragraph-level themes  
- 10 high-level: document-level patterns

Requirements: ≤5 words each, descriptive, no redundancy.

Text chunk:
{chunk_text}

Output JSON only:
{{"low-level": [...], "mid-level": [...], "high-level": [...]}}""" 

# Optimized prompt that maintains quality but improves performance
STRATEGY_1_OPTIMIZED_PROMPT = """Question: {QUESTION}

Task: Generate 30 tags for this text chunk at 3 abstraction levels.

Levels:
- Low (10): Sentence-level, specific, descriptive
- Mid (10): Paragraph-level, thematic  
- High (10): Document-level, patterns

Rules: ≤5 words each, no redundancy, descriptive not extractive.

Text chunk:
{chunk_text}

JSON output:
{{"low-level": [...], "mid-level": [...], "high-level": [...]}}""" 