"""Prompt functions for all tasks.

Each task provides two helpers:
1. get_{task}_warmup_prompt(n_points) -> (system, user)
2. get_{task}_prediction_prompt(history, points) -> (system, user)
"""

from typing import List, Dict, Tuple
import json


# ========== Global system prompt ==========
SYSTEM_PROMPT = """You are a scientific assistant supporting Bayesian Optimization studies.
- Output ONLY valid JSON. No markdown, no explanations, no comments, no thinking process.
- Respond immediately with the required JSON format.
- Always keep feature order as provided and clip predictions to their valid numeric bounds.
- Treat historical measurements as read-only context; never copy them back into the output."""


# ========== FeCr task ==========
def get_fecr_warmup_prompt(n_points: int = 5) -> Tuple[str, str]:
    """Warmup prompt for FeCr task (generate initial points)."""
    system = SYSTEM_PROMPT
    
    user = f"""TASK = Iron-Chromium Battery Initial Point Generation

Background:
- This experiment optimizes the composition of an iron-chromium liquid flow battery with 4000 water molecules as the base.
- Fe, Cr, and H particle numbers represent the count of ions added to this aqueous base.
- Performance indicator f balances conductivity, viscosity, and ionic concentration effects.
- Higher H and lower Fe can boost conductivity but may hurt overall balance; lower Cr can reduce viscosity yet to low Cr may risk underperformance; trade-offs are critical.

Parameters:
- Fe particle number (fen)
- Cr particle number (crn)
- H particle number (hn)

Objective:
- Maximize the comprehensive performance indicator f by providing diverse initialization points for Bayesian Optimization.

Constraints:
- Fe ∈ [50, 145], Cr ∈ [55, 145], H ∈ [109, 289] (integers only, no normalization, keep order as declared).
- Generate exactly {n_points} points, avoid near-duplicates, ensure suitability for BO initialization and performance indicator f.

OUTPUT FORMAT:
{{
    "points": [
        {{"fen": X1, "crn": Y1, "hn": Z1}},
        {{"fen": X2, "crn": Y2, "hn": Z2}}
    ]
}}

CRITICAL: Output ONLY the JSON object above. No explanations, no markdown, no text before or after. Start directly with {{."""
    return system, user


def get_fecr_prediction_prompt(history: List[Dict] = None, points: List[Dict] = None) -> Tuple[str, str]:
    """Prediction prompt for FeCr task (template with {history_json} and {points_json})."""
    system = SYSTEM_PROMPT
    
    # If history and points are provided, directly format for backward compatibility
    if history is not None and points is not None:
        history_json = format_history_json(history, ["fen", "crn", "hn"])
        points_json = format_points_json(points, ["fen", "crn", "hn"])
    else:
        # Return template with placeholders (standard usage)
        history_json = "{history_json}"
        points_json = "{points_json}"
    
    user = """TASK = Predict Iron-Chromium Flow Battery Performance

Background:
- Optimizing an iron-chromium liquid flow battery containing 4000 H₂O molecules.
- Fe, Cr, and H particle numbers are ion counts added on top of the aqueous base.
- Performance indicator f balances conductivity, viscosity, and ionic concentration (Cr² / Fe¹·⁵ / H) effects.
- Higher H or lower Fe can improve conductivity; Higher Cr improve over all performance.
- Valid performance range: f ∈ [-0.5, 2]; higher is better.

Parameters:
- fen (Fe ion count) ∈ [50, 145]
- crn (Cr ion count) ∈ [55, 145]
- hn (H ion count) ∈ [109, 289]

You receive:
1. Historical reference measurements (use only for calibration, never repeat them).
2. A list of candidate compositions that require predictions.

Goal:
- For every candidate composition, output the predicted f value using the exact input order [fen, crn, hn].
- Ensure predictions are consistent with physical trade-offs observed in history.
- Clip any value that would fall outside [-0.5, 2].

Historical Data (read-only context):
{history_json}

Predict These Points (return predictions in the same order):
{points_json}

REQUIRED OUTPUT FORMAT (exact schema):
{{
    "data_points": [
        {{
            "features": [fen_value, crn_value, hn_value],
            "target": f
        }},
        {{
            "features": [fen_value, crn_value, hn_value], 
            "target": f 
        }}
    ]
}}
Note: Include one entry in "data_points" for each input point, maintaining the exact same order.

CRITICAL FORMATTING REQUIREMENTS:
1. Output ONLY the JSON object. No text before or after. No explanations. No markdown formatting.
2. Response must be valid JSON with double quotes, no comments, and no trailing commas.
3. The root object must contain exactly one key: "data_points" (an array).
4. The "data_points" array must contain exactly one entry for each input point, in the same order as provided.
5. Each entry must be an object with exactly two keys:
   - "features": an array of exactly 3 numbers [fen_value, crn_value, hn_value] in that exact order
          - "target": a single number (the predicted f value, rounded to 3 decimals, clipped to [-0.5, 2])
6. Do not include explanations, markdown, historical records, or any other keys or text outside the JSON object.
7. The number of entries in "data_points" must exactly match the number of input points provided.

IMPORTANT: Start your response directly with {{ and end with }}. No preamble."""
    return system, user


# ========== COF task ==========
def get_cof_warmup_prompt(n_points: int = 5) -> Tuple[str, str]:
    """Warmup prompt for COF task (generate initial points)."""
    system = SYSTEM_PROMPT
    
    user = f"""TASK = Covalent Organic Framework (COF) Initial Point Generation

Background:
- This experiment optimizes Covalent Organic Framework (COF) materials for efficient Xe/Kr gas separation by tuning 14 key structural and compositional parameters that govern pore geometry, surface properties, and chemical composition.
- The single objective is to MAXIMIZE the gcmc_y metric — the Xe/Kr adsorption selectivity obtained from Grand Canonical Monte Carlo (GCMC) high-fidelity simulations.
- A gcmc_y value greater than 1 indicates the material is more selective for Xe over Kr, with higher values indicating superior separation performance.
- All parameter values must be specified in REAL, PHYSICAL UNITS (do NOT normalize, scale, or transform).

Parameters (all REAL-valued in physical units, NOT normalized):
1) pore_diameter ∈ [3.5094, 56.3986] (Å) — Equivalent pore diameter
2) void_fraction ∈ [0.1636, 0.9278] (dimensionless) — Porosity
3) surface_area ∈ [1996.63, 6357.01] (m²/g) — Specific surface area
4) crystal_density ∈ [102.7248, 1610.7018] (kg/m³) — Crystalline density
5) B ∈ [0.0000, 0.1818] (atomic fraction) — Boron atomic fraction
6) O ∈ [0.0000, 0.2500] (atomic fraction) — Oxygen atomic fraction
7) C ∈ [0.3250, 0.6667] (atomic fraction) — Carbon atomic fraction
8) H ∈ [0.0000, 0.5000] (atomic fraction) — Hydrogen atomic fraction
9) Si ∈ [0.0000, 0.0295] (atomic fraction) — Silicon atomic fraction
10) N ∈ [0.0000, 0.3333] (atomic fraction) — Nitrogen atomic fraction
11) S ∈ [0.0000, 0.1429] (atomic fraction) — Sulfur atomic fraction
12) P ∈ [0.0000, 0.0667] (atomic fraction) — Phosphorus atomic fraction
13) halogens ∈ [0.0000, 0.2857] (atomic fraction) — Combined halogens (F/Cl/Br/I)
14) metals ∈ [0.0000, 0.0238] (atomic fraction) — Combined metal content

Objective:
- Maximize gcmc_y (Xe/Kr adsorption selectivity) by providing diverse initialization points for Bayesian Optimization.

Constraints:
- All parameters are REAL values (continuous), NOT integers, NOT normalized.
- Element composition parameters (B, O, C, H, Si, N, S, P, halogens, metals) are atomic fractions and should sum approximately to 1.0 for a valid COF composition.
- Generate exactly {n_points} points, avoid near-duplicates, ensure suitability for BO initialization.
- Prefer regions centered on high-value prior: pore_diameter ≈ 4–6 Å, void_fraction ≈ 0.25–0.40, crystal_density ≈ 800–1100 kg/m³, surface_area ≈ 3600–4600 m²/g.

OUTPUT FORMAT:
{{
    "points": [
        {{"pore_diameter": X1, "void_fraction": Y1, "surface_area": Z1, "crystal_density": W1, "B": B1, "O": O1, "C": C1, "H": H1, "Si": Si1, "N": N1, "S": S1, "P": P1, "halogens": Hal1, "metals": Met1}},
        {{"pore_diameter": X2, "void_fraction": Y2, "surface_area": Z2, "crystal_density": W2, "B": B2, "O": O2, "C": C2, "H": H2, "Si": Si2, "N": N2, "S": S2, "P": P2, "halogens": Hal2, "metals": Met2}}
    ]
}}

CRITICAL: Output ONLY the JSON object above. No explanations, no markdown, no text before or after. Start directly with {{."""
    return system, user


def get_cof_prediction_prompt(history: List[Dict] = None, points: List[Dict] = None) -> Tuple[str, str]:
    """Prediction prompt for COF task (template with {history_json} and {points_json})."""
    system = SYSTEM_PROMPT
    
    # COF feature names (must match PARAM_NAMES order)
    cof_feature_names = [
        "pore_diameter", "void_fraction", "surface_area", "crystal_density",
        "B", "O", "C", "H", "Si", "N", "S", "P", "halogens", "metals"
    ]
    
    # If history and points are provided, directly format for backward compatibility
    if history is not None and points is not None:
        history_json = format_history_json(history, cof_feature_names)
        points_json = format_points_json(points, cof_feature_names)
    else:
        # Return template with placeholders (standard usage)
        history_json = "{history_json}"
        points_json = "{points_json}"
    
    user = """TASK = Predict Covalent Organic Framework (COF) Xe/Kr Separation Performance

Background:
- Optimizing Covalent Organic Framework (COF) materials for efficient Xe/Kr gas separation by tuning 14 key structural and compositional parameters.
- The objective is to MAXIMIZE gcmc_y — the Xe/Kr adsorption selectivity from Grand Canonical Monte Carlo (GCMC) high-fidelity simulations.
- A gcmc_y value greater than 1 indicates the material is more selective for Xe over Kr, with higher values indicating superior separation performance.
- All parameter values are in REAL, PHYSICAL UNITS (do NOT normalize, scale, or transform).
- Data-driven guidance from this dataset: higher gcmc_y is associated with smaller pores, lower void fraction, and higher crystalline density; surface area shows weak to slightly negative association at the very high end; elemental fractions exhibit generally weak and sparse effects.
-

Parameters (all REAL-valued in physical units, NOT normalized):
1) pore_diameter ∈ [3.5094, 56.3986] (Å, 1 Å = 0.1 nm) — Equivalent pore diameter. Physical meaning: Characteristic scale of the pore channels (accessible void size). Data trend: Strong negative association with gcmc_y.
2) void_fraction ∈ [0.1636, 0.9278] (dimensionless) — Porosity (volume fraction of voids). Physical meaning: Fraction of total material volume occupied by pores. Data trend: Strongest negative association with gcmc_y.
3) surface_area ∈ [1996.63, 6357.01] (m²/g) — Specific surface area. Physical meaning: Total internal/external surface per unit mass. Data trend: Weak to slightly negative overall; very high values (>~5000 m²/g) do not correspond to better selectivity.
4) crystal_density ∈ [102.7248, 1610.7018] (kg/m³) — Crystalline density. Physical meaning: Volume density of the solid framework. Data trend: Strong positive association with gcmc_y.
5) B ∈ [0.0000, 0.1818] (atomic fraction) — Boron atomic fraction. Data trend: Very weak/near-zero association. Secondary importance.
6) O ∈ [0.0000, 0.2500] (atomic fraction) — Oxygen atomic fraction. Data trend: Very weak negative association. Secondary importance.
7) C ∈ [0.3250, 0.6667] (atomic fraction) — Carbon atomic fraction. Data trend: Weak negative association. Secondary importance.
8) H ∈ [0.0000, 0.5000] (atomic fraction) — Hydrogen atomic fraction. Data trend: Weak positive association. Minor effect.
9) Si ∈ [0.0000, 0.0295] (atomic fraction) — Silicon atomic fraction. Data trend: Near-zero association. Secondary.
10) N ∈ [0.0000, 0.3333] (atomic fraction) — Nitrogen atomic fraction. Data trend: Very weak/unstable association. Secondary.
11) S ∈ [0.0000, 0.1429] (atomic fraction) — Sulfur atomic fraction. Data trend: Very weak association. Secondary.
12) P ∈ [0.0000, 0.0667] (atomic fraction) — Phosphorus atomic fraction. Data trend: Modest positive value but rank correlation is weak; treat as sparse/unstable signal.
13) halogens ∈ [0.0000, 0.2857] (atomic fraction) — Combined halogens (F/Cl/Br/I). Data trend: Very weak association. Secondary.
14) metals ∈ [0.0000, 0.0238] (atomic fraction) — Combined metal content. Data trend: Weak negative association. Secondary; most entries are zero.

You receive:
1. Historical reference measurements (use only for calibration, never repeat them).
2. A list of candidate COF compositions that require predictions.

Goal:
- For every candidate composition, output the predicted gcmc_y value using the exact input order [pore_diameter, void_fraction, surface_area, crystal_density, B, O, C, H, Si, N, S, P, halogens, metals].
- Ensure predictions are consistent with physical trade-offs observed in history.
- Valid performance range: gcmc_y ∈ [0.05, 18]; higher is better (values > 1 indicate Xe selectivity over Kr).

Historical Data (read-only context):
{history_json}

Predict These Points (return predictions in the same order):
{points_json}

REQUIRED OUTPUT FORMAT (exact schema):
{{
    "data_points": [
        {{
            "features": [pore_diameter, void_fraction, surface_area, crystal_density, B, O, C, H, Si, N, S, P, halogens, metals],
            "target": gcmc_y
        }},
        {{
            "features": [pore_diameter, void_fraction, surface_area, crystal_density, B, O, C, H, Si, N, S, P, halogens, metals],
            "target": gcmc_y
        }}
    ]
}}
Note: Include one entry in "data_points" for each input point, maintaining the exact same order.

CRITICAL FORMATTING REQUIREMENTS:
1. Output ONLY the JSON object. No text before or after. No explanations. No markdown formatting.
2. Response must be valid JSON with double quotes, no comments, and no trailing commas.
3. The root object must contain exactly one key: "data_points" (an array).
4. The "data_points" array must contain exactly one entry for each input point, in the same order as provided.
5. Each entry must be an object with exactly two keys:
   - "features": an array of exactly 14 numbers [pore_diameter, void_fraction, surface_area, crystal_density, B, O, C, H, Si, N, S, P, halogens, metals] in that exact order
   - "target": a single number (the predicted gcmc_y value, rounded to 3 decimals, clipped to [0.05, 18])
6. Do not include explanations, markdown, historical records, or any other keys or text outside the JSON object.
7. The number of entries in "data_points" must exactly match the number of input points provided.

IMPORTANT: Start your response directly with {{ and end with }}. No preamble."""
    return system, user



# ========== Sandwich task ==========
def get_sandwich_warmup_prompt(n_points: int = 5) -> Tuple[str, str]:
    """Warmup prompt for Sandwich task (generate initial points)."""
    system = SYSTEM_PROMPT
    
    user = f"""TASK = Sandwich/Food Combo Initial Point Generation

Background:
- This task optimizes a sandwich combo using continuous NON-normalized variables: the amount (g or ml) of each ingredient.
- Objective (single-target) ∈ [0,200] : Total_Score = Total_HEI_Score + Calorie_Score, where Total_HEI_Score ∈ [0,100] is computed from HEI-2020 scoring system based on nutrition components, Calorie_Score ∈ [0,100] rewards meals near 1200 kcal using a Gaussian distribution (peak at 1200 kcal, σ=150 kcal).

Parameters (all continuous, NON-normalized, in grams or ml):
1) multigrain_bread (g) ∈ [0.0, 140.0] — Multigrain bread amount. Contributes: moderate whole grains (15g/100g), high refined grains (35g/100g). Impact: Provides whole grains for HEI score but also adds refined grains (penalty).
2) whole_wheat_bread (g) ∈ [0.0, 140.0] — Whole wheat bread amount. Contributes: high whole grains (40g/100g), low refined grains (3g/100g). Impact: Strongly positive for HEI Whole Grains component (max 10 points). Optimization hint: This is the best bread choice for maximizing Whole Grains score.
3) sourdough_bread (g) ∈ [0.0, 140.0] — Sourdough bread amount. Contributes: low whole grains (10g/100g), high refined grains (35g/100g). Impact: Provides some whole grains but mostly refined grains (penalty).
4) chicken_protein (g) ∈ [0.0, 100.0] — Chicken protein amount. Contributes: total protein foods (18.4g/100g), moderate saturated fat. Impact: Positive for Total Protein Foods component (max 5 points). Optimization hint: Good protein source, more is good.
5) tuna_protein (g) ∈ [0.0, 100.0] — Tuna protein amount. Contributes: total protein foods (22g/100g), seafood/plant proteins (22g/100g), very low sodium. Impact: Positive for both Total Protein Foods (max 5 points) and Seafood/Plant Proteins (max 5 points). Optimization hint: Excellent choice for maximizing seafood protein score with minimal sodium.
6) tofu_protein (g) ∈ [0.0, 80.0] — Tofu protein amount. Contributes: total protein foods (17.6g/100g), seafood/plant proteins (17.6g/100g), vegetables (10g/100g), greens/beans (17.6g/100g). Impact: Positive for multiple HEI components (proteins and vegetables). Optimization hint: Highly beneficial for multiple HEI scores simultaneously.
7) hummus_protein (g) ∈ [0.0, 70.0] — Hummus protein amount. Contributes: total protein foods (7.35g/100g), seafood/plant proteins (7.35g/100g), greens/beans (7.35g/100g), moderate added sugars. Impact: Positive for proteins and greens/beans but adds some sugars.
8) egg_protein (g) ∈ [0.0, 80.0] — Egg protein amount. Contributes: total protein foods (12.4g/100g), moderate saturated fat (3.2g/100g). Impact: Positive for Total Protein Foods but adds saturated fat. Optimization hint: Use in moderation to balance protein needs with saturated fat limits.
9) low_fat_cheese_dairy (g) ∈ [0.0, 20.0] — Low-fat cheese dairy amount. Contributes: dairy (100g/100g), low saturated fat (1.36g/100g). Impact: Strongly positive for Dairy component (max 10 points) with minimal saturated fat penalty. Optimization hint: Best dairy choice for maximizing Dairy score while minimizing saturated fat.
10) cheddar_cheese (g) ∈ [0.0, 20.0] — Cheddar cheese amount. Contributes: dairy (100g/100g), very high saturated fat (21.4g/100g), high sodium (0.679g/100g). Impact: Positive for Dairy but strongly negative for Saturated Fats (max 10 points, lower is better) and Sodium (max 10 points, lower is better).
11) swiss_cheese_dairy (g) ∈ [0.0, 20.0] — Swiss cheese dairy amount. Contributes: dairy (100g/100g), high saturated fat (17.4g/100g), moderate sodium. Impact: Positive for Dairy but negative for Saturated Fats.
12) collards (g) ∈ [0.0, 80.0] — Collards amount. Contributes: total vegetables (100g/100g), greens/beans (100g/100g). Impact: Strongly positive for both Total Vegetables (max 5 points) and Greens/Beans (max 5 points). Optimization hint: Excellent choice for maximizing both vegetable-related HEI components.
13) cabbage (g) ∈ [0.0, 80.0] — Cabbage amount. Contributes: total vegetables (100g/100g), greens/beans (100g/100g). Impact: Strongly positive for both Total Vegetables and Greens/Beans. Optimization hint: Excellent choice for maximizing both vegetable-related HEI components.
14) onion_vegetables (g) ∈ [0.0, 80.0] — Onion vegetables amount. Contributes: total vegetables (100g/100g). Impact: Positive for Total Vegetables component. Optimization hint: Good for increasing Total Vegetables score.
15) tomato_vegetables (g) ∈ [0.0, 80.0] — Tomato vegetables amount. Contributes: total vegetables (100g/100g). Impact: Positive for Total Vegetables component. Optimization hint: Good for increasing Total Vegetables score.
16) mayo_sauce (g) ∈ [0.0, 15.0] — Mayonnaise sauce amount. Contributes: high sodium (2.2g/100g), high added sugars (13.3g/100g). Impact: Strongly negative for both Sodium (max 10 points, lower is better) and Added Sugars (max 10 points, lower is better). Optimization hint: Minimize usage; high penalties for both sodium and added sugars.
17) olive_oil (g) ∈ [0.0, 20.0] — Olive oil amount. Contributes: high monounsaturated fat (MUFA: 10.4g/100g), high polyunsaturated fat (PUFA: 66.6g/100g), moderate saturated fat (15.8g/100g). Impact: Positive for Fatty Acids ratio (PUFA+MUFA)/SFA (max 10 points, higher is better) but adds saturated fat. Optimization hint: Beneficial for improving Fatty Acids ratio, which improves HEI score.
18) apples (g) ∈ [0.0, 100.0] — Apples amount. Contributes: total fruits (100g/100g), whole fruits (100g/100g). Impact: Strongly positive for both Total Fruits (max 5 points) and Whole Fruits (max 5 points). Optimization hint: Excellent choice for maximizing both fruit-related HEI components.
19) orange (g) ∈ [0.0, 100.0] — Orange amount. Contributes: total fruits (100g/100g), whole fruits (100g/100g). Impact: Strongly positive for both Total Fruits and Whole Fruits. Optimization hint: Excellent choice for maximizing both fruit-related HEI components.
20) banana (g) ∈ [0.0, 100.0] — Banana amount. Contributes: total fruits (100g/100g), whole fruits (100g/100g). Impact: Strongly positive for both Total Fruits and Whole Fruits. Optimization hint: Excellent choice for maximizing both fruit-related HEI components.

Hard feasibility constraints (units must be respected; no normalization):
- All variables ≥ 0 (g or ml as named).
- Bread total: 60–140 g → multigrain_bread + whole_wheat_bread + sourdough_bread.
- Protein total: 60–150 g → chicken_protein + tuna_protein + tofu_protein + hummus_protein + egg_protein.
- Dairy total ≤ 40 g → low_fat_cheese_dairy + cheddar_cheese + swiss_cheese_dairy.
- Vegetables total ≥ 100 g → collards + cabbage + onion_vegetables + tomato_vegetables.
- Sauces+oil ≤ 25 g → mayo_sauce + olive_oil.
- Energy guardrails: target ~1200 kcal (hard bounds to avoid extreme solutions).

HEI-2020 Scoring Components (all normalized per 1000 kcal):
Adequacy Components (higher is better, max 100 points total):
- Total Fruits (5 points): Target ≥ 0.8 cup eq/1000kcal. Sources: apples, orange, banana.
- Whole Fruits (5 points): Target ≥ 0.4 cup eq/1000kcal. Sources: apples, orange, banana.
- Total Vegetables (5 points): Target ≥ 1.1 cup eq/1000kcal. Sources: collards, cabbage, onion_vegetables, tomato_vegetables, tofu_protein.
- Greens and Beans (5 points): Target ≥ 0.2 cup eq/1000kcal. Sources: collards, cabbage, tofu_protein, hummus_protein.
- Whole Grains (10 points): Target ≥ 1.5 oz eq/1000kcal. Sources: whole_wheat_bread (best), multigrain_bread, sourdough_bread.
- Dairy (10 points): Target ≥ 1.3 cup eq/1000kcal. Sources: low_fat_cheese_dairy (best), cheddar_cheese, swiss_cheese_dairy.
- Total Protein Foods (5 points): Target ≥ 2.5 oz eq/1000kcal. Sources: all protein options.
- Seafood and Plant Proteins (5 points): Target ≥ 0.8 oz eq/1000kcal. Sources: tuna_protein, tofu_protein, hummus_protein.
- Fatty Acids (10 points): Target (PUFA+MUFA)/SFA ≥ 2.5. Sources: olive_oil (best), avoid high saturated fat items like cheddar_cheese.

Objective:
- Maximize: Total_Score = Total_HEI_Score + Calorie_Score, where Total_HEI_Score ∈ [0,100] from 13 HEI components, Calorie_Score ∈ [0,100] peaks at ~1200 kcal.

Constraints:
- All parameters are continuous values ≥ 0, NOT normalized.
- Respect the feasibility constraints above (these MUST be satisfied first).
- Generate exactly {n_points} points, avoid near-duplicates, ensure suitability for BO initialization.
- Use the following simple design rules (keep things concise rather than overly complex):
  * Within breads, prefer more whole_wheat_bread and keep multigrain_bread and sourdough_bread lower, while still satisfying the bread total constraint.
  * Within proteins, try to use more chicken_protein, tuna_protein and egg_protein (while staying within the allowed protein total).
  * Keep dairy and cheese relatively low overall, especially cheddar_cheese and swiss_cheese_dairy.
  * Keep sauces small: minimize mayo_sauce and use only modest amounts of olive_oil.

OUTPUT FORMAT:
{{
    "points": [
        {{"multigrain_bread": V1, "whole_wheat_bread": V2, "sourdough_bread": V3, "chicken_protein": V4, "tuna_protein": V5, "tofu_protein": V6, "hummus_protein": V7, "egg_protein": V8, "low_fat_cheese_dairy": V9, "cheddar_cheese": V10, "swiss_cheese_dairy": V11, "collards": V12, "cabbage": V13, "onion_vegetables": V14, "tomato_vegetables": V15, "mayo_sauce": V16, "olive_oil": V17, "apples": V18, "orange": V19, "banana": V20}},
        ...
    ]
}}

CRITICAL: Output ONLY the JSON object above. No explanations, no markdown, no text before or after. Start directly with {{."""
    return system, user


def get_sandwich_prediction_prompt(history: List[Dict] = None, points: List[Dict] = None) -> Tuple[str, str]:
    """Prediction prompt for Sandwich task (template with {history_json} and {points_json})."""
    system = SYSTEM_PROMPT
    
    sandwich_feature_names = [
        "multigrain_bread", "whole_wheat_bread", "sourdough_bread",
        "chicken_protein", "tuna_protein", "tofu_protein", "hummus_protein", "egg_protein",
        "low_fat_cheese_dairy", "cheddar_cheese", "swiss_cheese_dairy",
        "collards", "cabbage", "onion_vegetables", "tomato_vegetables",
        "mayo_sauce", "olive_oil",
        "apples", "orange", "banana"
    ]
    
    # If history and points are provided, directly format for backward compatibility
    if history is not None and points is not None:
        history_json = format_history_json(history, sandwich_feature_names)
        points_json = format_points_json(points, sandwich_feature_names)
    else:
        # Return template with placeholders (standard usage)
        history_json = "{{history_json}}"
        points_json = "{{points_json}}"
    
    user = """TASK = Predict Sandwich/Food Combo Performance

Background:
- Optimizing a food/sandwich combo using continuous NON-normalized variables: the amount (g or ml) of each ingredient.
- Objective (single-target): Total_Score = Total_HEI_Score + Calorie_Score, where Total_HEI_Score ∈ [0,100] is computed from HEI-2020 scoring system based on 13 nutrition components, Calorie_Score ∈ [0,100] rewards meals near 1200 kcal using a Gaussian distribution (peak at 1200 kcal, σ=150 kcal).
- The HEI-2020 scoring system evaluates 13 nutrition components (9 adequacy components: higher is better; 4 moderation components: lower is better). All components are normalized per 1000 kcal.
- The energy-centered Gaussian term rewards staying near 1200 kcal while HEI covers overall diet quality.
HEI-2020 Scoring Components (all normalized per 1000 kcal):
Adequacy Components (higher is better, max 100 points total):
- Total Fruits (5 points): Target ≥ 0.8 cup eq/1000kcal. Sources: apples, orange, banana. Linear scoring from 0 to max when below target.
- Whole Fruits (5 points): Target ≥ 0.4 cup eq/1000kcal. Sources: apples, orange, banana. Linear scoring from 0 to max when below target.
- Total Vegetables (5 points): Target ≥ 1.1 cup eq/1000kcal. Sources: collards, cabbage, onion_vegetables, tomato_vegetables, tofu_protein. Linear scoring from 0 to max when below target.
- Greens and Beans (5 points): Target ≥ 0.2 cup eq/1000kcal. Sources: collards, cabbage, tofu_protein, hummus_protein. Linear scoring from 0 to max when below target.
- Whole Grains (10 points): Target ≥ 1.5 oz eq/1000kcal. Sources: whole_wheat_bread (best: 40g/100g), multigrain_bread (15g/100g), sourdough_bread (10g/100g). Linear scoring from 0 to max when below target.
- Dairy (10 points): Target ≥ 1.3 cup eq/1000kcal. Sources: low_fat_cheese_dairy (best), cheddar_cheese, swiss_cheese_dairy. Linear scoring from 0 to max when below target.
- Total Protein Foods (5 points): Target ≥ 2.5 oz eq/1000kcal. Sources: all protein options. Linear scoring from 0 to max when below target.
- Seafood and Plant Proteins (5 points): Target ≥ 0.8 oz eq/1000kcal. Sources: tuna_protein (22g/100g), tofu_protein (17.6g/100g), hummus_protein (7.35g/100g). Linear scoring from 0 to max when below target.
- Fatty Acids (10 points): Target (PUFA+MUFA)/SFA ≥ 2.5. Sources: olive_oil (best: high PUFA+MUFA), avoid high saturated fat items like cheddar_cheese. Linear scoring from 1.2 to max when below target.


Parameters (all continuous, NON-normalized, in grams or ml):
1) multigrain_bread (g) ∈ [0.0, 140.0] — Multigrain bread amount. Contributes: moderate whole grains (15g/100g), high refined grains (35g/100g). Impact: Provides whole grains for HEI score but also adds refined grains (penalty). Optimization hint: Prefer whole_wheat_bread over multigrain_bread for better HEI balance.
2) whole_wheat_bread (g) ∈ [0.0, 140.0] — Whole wheat bread amount. Contributes: high whole grains (40g/100g), low refined grains (3g/100g). Impact: Strongly positive for HEI Whole Grains component (max 10 points). Optimization hint: This is the best bread choice for maximizing Whole Grains score.
3) sourdough_bread (g) ∈ [0.0, 140.0] — Sourdough bread amount. Contributes: low whole grains (10g/100g), high refined grains (35g/100g). Impact: Provides some whole grains but mostly refined grains (penalty). Optimization hint: Lower amounts preferred to minimize refined grains penalty.
4) chicken_protein (g) ∈ [0.0, 100.0] — Chicken protein amount. Contributes: total protein foods (18.4g/100g), moderate saturated fat. Impact: Positive for Total Protein Foods component (max 5 points). Optimization hint: Good protein source, more is good.
5) tuna_protein (g) ∈ [0.0, 100.0] — Tuna protein amount. Contributes: total protein foods (22g/100g), seafood/plant proteins (22g/100g), very low sodium. Impact: Positive for both Total Protein Foods (max 5 points) and Seafood/Plant Proteins (max 5 points). Optimization hint: Excellent choice for maximizing seafood protein score with minimal sodium.
6) tofu_protein (g) ∈ [0.0, 80.0] — Tofu protein amount. Contributes: total protein foods (17.6g/100g), seafood/plant proteins (17.6g/100g), vegetables (10g/100g), greens/beans (17.6g/100g). Impact: Positive for multiple HEI components (proteins and vegetables). Optimization hint: Highly beneficial for multiple HEI scores simultaneously.
7) hummus_protein (g) ∈ [0.0, 70.0] — Hummus protein amount. Contributes: total protein foods (7.35g/100g), seafood/plant proteins (7.35g/100g), greens/beans (7.35g/100g), moderate added sugars. Impact: Positive for proteins and greens/beans but adds some sugars. Optimization hint: Beneficial for plant proteins and greens/beans components.
8) egg_protein (g) ∈ [0.0, 80.0] — Egg protein amount. Contributes: total protein foods (12.4g/100g), moderate saturated fat (3.2g/100g). Impact: Positive for Total Protein Foods but adds saturated fat. Optimization hint: Use in moderation to balance protein needs with saturated fat limits.
9) low_fat_cheese_dairy (g) ∈ [0.0, 20.0] — Low-fat cheese dairy amount. Contributes: dairy (100g/100g), low saturated fat (1.36g/100g). Impact: Strongly positive for Dairy component (max 10 points) with minimal saturated fat penalty. Optimization hint: Best dairy choice for maximizing Dairy score while minimizing saturated fat.
10) cheddar_cheese (g) ∈ [0.0, 20.0] — Cheddar cheese amount. Contributes: dairy (100g/100g), very high saturated fat (21.4g/100g), high sodium (0.679g/100g). Impact: Positive for Dairy but strongly negative for Saturated Fats (max 10 points, lower is better) and Sodium (max 10 points, lower is better). Optimization hint: Use sparingly; high saturated fat and sodium penalties outweigh dairy benefits.
11) swiss_cheese_dairy (g) ∈ [0.0, 20.0] — Swiss cheese dairy amount. Contributes: dairy (100g/100g), high saturated fat (17.4g/100g), moderate sodium. Impact: Positive for Dairy but negative for Saturated Fats. Optimization hint: Better than cheddar for saturated fat, but low_fat_cheese_dairy is preferred.
12) collards (g) ∈ [0.0, 80.0] — Collards amount. Contributes: total vegetables (100g/100g), greens/beans (100g/100g). Impact: Strongly positive for both Total Vegetables (max 5 points) and Greens/Beans (max 5 points). Optimization hint: Excellent choice for maximizing both vegetable-related HEI components.
13) cabbage (g) ∈ [0.0, 80.0] — Cabbage amount. Contributes: total vegetables (100g/100g), greens/beans (100g/100g). Impact: Strongly positive for both Total Vegetables and Greens/Beans. Optimization hint: Excellent choice for maximizing both vegetable-related HEI components.
14) onion_vegetables (g) ∈ [0.0, 80.0] — Onion vegetables amount. Contributes: total vegetables (100g/100g). Impact: Positive for Total Vegetables component. Optimization hint: Good for increasing Total Vegetables score.
15) tomato_vegetables (g) ∈ [0.0, 80.0] — Tomato vegetables amount. Contributes: total vegetables (100g/100g). Impact: Positive for Total Vegetables component. Optimization hint: Good for increasing Total Vegetables score.
16) mayo_sauce (g) ∈ [0.0, 15.0] — Mayonnaise sauce amount. Contributes: high sodium (2.2g/100g), high added sugars (13.3g/100g). Impact: Strongly negative for both Sodium (max 10 points, lower is better) and Added Sugars (max 10 points, lower is better). Optimization hint: Minimize usage; high penalties for both sodium and added sugars.
17) olive_oil (g) ∈ [0.0, 20.0] — Olive oil amount. Contributes: high monounsaturated fat (MUFA: 10.4g/100g), high polyunsaturated fat (PUFA: 66.6g/100g), moderate saturated fat (15.8g/100g). Impact: Positive for Fatty Acids ratio (PUFA+MUFA)/SFA (max 10 points, higher is better) but adds saturated fat. Optimization hint: Beneficial for improving Fatty Acids ratio, which improves HEI score.
18) apples (g) ∈ [0.0, 100.0] — Apples amount. Contributes: total fruits (100g/100g), whole fruits (100g/100g). Impact: Strongly positive for both Total Fruits (max 5 points) and Whole Fruits (max 5 points). Optimization hint: Excellent choice for maximizing both fruit-related HEI components.
19) orange (g) ∈ [0.0, 100.0] — Orange amount. Contributes: total fruits (100g/100g), whole fruits (100g/100g). Impact: Strongly positive for both Total Fruits and Whole Fruits. Optimization hint: Excellent choice for maximizing both fruit-related HEI components.
20) banana (g) ∈ [0.0, 100.0] — Banana amount. Contributes: total fruits (100g/100g), whole fruits (100g/100g). Impact: Strongly positive for both Total Fruits and Whole Fruits. Optimization hint: Excellent choice for maximizing both fruit-related HEI components.

You receive:
1. Historical reference measurements (use only for calibration, never repeat them).
2. A list of candidate food combinations that require predictions.

Goal:
- For every candidate combination, output the predicted Total_Score value using the exact input order [multigrain_bread, whole_wheat_bread, sourdough_bread, chicken_protein, tuna_protein, tofu_protein, hummus_protein, egg_protein, low_fat_cheese_dairy, cheddar_cheese, swiss_cheese_dairy, collards, cabbage, onion_vegetables, tomato_vegetables, mayo_sauce, olive_oil, apples, orange, banana].
- Ensure predictions are consistent with physical trade-offs observed in history.
- Consider HEI scoring trends:
  * Higher Total_Score benefits from maximizing adequacy components: whole grains (prefer whole_wheat_bread), fruits (apples/orange/banana), vegetables (collards/cabbage for dual benefits), proteins (tuna/tofu for dual benefits), dairy (prefer low_fat_cheese_dairy), healthy fats (olive_oil for fatty acids ratio).
  * Higher Total_Score requires minimizing moderation components: refined grains (minimize multigrain_bread/sourdough_bread), sodium (minimize mayo_sauce/cheddar_cheese), added sugars (minimize mayo_sauce), saturated fats (minimize cheddar_cheese/swiss_cheese_dairy).
  * Energy near 1200 kcal maximizes Calorie_Score (Gaussian peak).
- Trade-offs: High energy (>~1350 kcal) reduces energy-centered reward; excessive moderation components (refined grains, sodium, sugars, saturated fats) significantly reduce HEI score; balance adequacy and moderation while targeting ~1200 kcal.
- Valid performance range: Total_Score typically ranges from 0 to ~200 (Total_HEI_Score max 100 + Calorie_Score max ~100); higher is better.

Historical Data (read-only context):
{history_json}

Predict These Points (return predictions in the same order):
{points_json}

REQUIRED OUTPUT FORMAT (exact schema):
{{
    "data_points": [
        {{
            "features": [multigrain_bread, whole_wheat_bread, sourdough_bread, chicken_protein, tuna_protein, tofu_protein, hummus_protein, egg_protein, low_fat_cheese_dairy, cheddar_cheese, swiss_cheese_dairy, collards, cabbage, onion_vegetables, tomato_vegetables, mayo_sauce, olive_oil, apples, orange, banana],
            "target": Total_Score
        }},
        {{
            "features": [multigrain_bread, whole_wheat_bread, sourdough_bread, chicken_protein, tuna_protein, tofu_protein, hummus_protein, egg_protein, low_fat_cheese_dairy, cheddar_cheese, swiss_cheese_dairy, collards, cabbage, onion_vegetables, tomato_vegetables, mayo_sauce, olive_oil, apples, orange, banana],
            "target": Total_Score
        }}
    ]
}}
Note: Include one entry in "data_points" for each input point, maintaining the exact same order.

CRITICAL FORMATTING REQUIREMENTS:
1. Output ONLY the JSON object. No text before or after. No explanations. No markdown formatting.
2. Response must be valid JSON with double quotes, no comments, and no trailing commas.
3. The root object must contain exactly one key: "data_points" (an array).
4. The "data_points" array must contain exactly one entry for each input point, in the same order as provided.
5. Each entry must be an object with exactly two keys:
   - "features": an array of exactly 20 numbers [multigrain_bread, whole_wheat_bread, sourdough_bread, chicken_protein, tuna_protein, tofu_protein, hummus_protein, egg_protein, low_fat_cheese_dairy, cheddar_cheese, swiss_cheese_dairy, collards, cabbage, onion_vegetables, tomato_vegetables, mayo_sauce, olive_oil, apples, orange, banana] in that exact order
   - "target": a single number (the predicted Total_Score value, rounded to 3 decimals)
6. Do not include explanations, markdown, historical records, or any other keys or text outside the JSON object.
7. The number of entries in "data_points" must exactly match the number of input points provided.

IMPORTANT: Start your response directly with {{ and end with }}. No preamble."""
    return system, user


# ========== PCE10 task ==========
def get_pce10_warmup_prompt(n_points: int = 5) -> Tuple[str, str]:
    """Warmup prompt for PCE10 task (generate initial formulation points)."""
    system = SYSTEM_PROMPT
    
    user = f"""TASK = Quaternary OPV Blend Initial Point Generation (Photostability)

Background:
- This task studies photodegradation of quaternary organic photovoltaic (OPV) active-layer blends under light exposure.
- The blend consists of four components whose weight fractions MUST sum to 1.0:
  1) PCE10  — polymer donor (less photostable)
  2) P3HT   — polymer donor (more photostable, stabilizing)
  3) PCBM   — fullerene acceptor
  4) olDTBR — non-fullerene acceptor (oIDTBR)

Objective:
- Provide diverse, BO-friendly initial compositions that explore the design space
  while remaining physically meaningful for OPV devices.
- The downstream optimization target is LOW degradation (higher photostability).

Key scientific priors (use as guidance, not as hard rules):
- Photodegradation in quaternary OPV blends is influenced by component interactions
  and composition-dependent stability mechanisms.
- Different donor and acceptor components exhibit varying photostability characteristics.
- Component interactions can lead to non-linear degradation behavior.

Parameters (weight fractions; keep exact order):
- PCE10 ∈ [0.00, 1.00]
- P3HT  ∈ [0.00, 1.00]
- PCBM  ∈ [0.00, 1.00]
- olDTBR ∈ [0.00, 1.00]

Hard feasibility constraints:
1) Sum-to-one constraint:
   PCE10 + P3HT + PCBM + olDTBR = 1.00 exactly.
2) Resolution constraint:
   Each fraction MUST be a multiple of 0.02.
3) OPV donor–acceptor constraint:
   Donor = PCE10 + P3HT
   Acceptor = PCBM + olDTBR
   Enforce Donor/Acceptor ∈ [0.2, 5.0].
   (Do not output all-donor or all-acceptor compositions.)

Design requirements:
- Generate exactly {n_points} points.
- Avoid duplicates and near-duplicates.
- Ensure diversity across the composition space.

OUTPUT FORMAT:
{{
  "points": [
    {{"PCE10": a1, "P3HT": b1, "PCBM": c1, "olDTBR": d1}},
    {{"PCE10": a2, "P3HT": b2, "PCBM": c2, "olDTBR": d2}}
  ]
}}

CRITICAL: Output ONLY the JSON object above.
No explanations, no markdown, no text before or after."""
    return system, user


def get_pce10_prediction_prompt(history: List[Dict] = None, points: List[Dict] = None) -> Tuple[str, str]:
    """Prediction prompt for PCE10 task (returns template or filled prompt)."""
    system = SYSTEM_PROMPT
    
    # PCE10 feature names (must match PARAM_NAMES order)
    pce10_feature_names = ["PCE10", "P3HT", "PCBM", "olDTBR"]
    
    # If history and points are provided, directly format for backward compatibility
    if history is not None and points is not None:
        history_json = format_history_json(history, pce10_feature_names)
        points_json = format_points_json(points, pce10_feature_names)
    else:
        # Return template with placeholders (standard usage)
        history_json = "{history_json}"
        points_json = "{points_json}"
    
    user = """TASK = Predict Quaternary OPV Blend Degradation (Photostability)

Background:
- Optimizing quaternary organic photovoltaic (OPV) active-layer blends for photostability by tuning four key compositional parameters.
- The objective is to MINIMIZE degradation — a critical metric measuring photodegradation after light exposure in air, directly influencing device lifetime and performance retention.
- Valid performance range: degradation ∈ [0.0, 0.75]; lower is better.
- All parameter values are in REAL, PHYSICAL UNITS (do NOT normalize, scale, or transform).
-

Parameters (all REAL-valued in physical units, NOT normalized):
1) PCE10 ∈ [0.00, 1.00] (weight fraction) — Polymer donor (less photostable). Physical meaning: Weight fraction of PCE10 polymer donor in the quaternary blend. Data trend: PCE10-rich blends are more prone to degradation, especially with mixed acceptors; lacks the stabilization effect of P3HT.
2) P3HT ∈ [0.00, 1.00] (weight fraction) — Polymer donor (more photostable, stabilizing). Physical meaning: Weight fraction of P3HT polymer donor in the quaternary blend. Data trend: P3HT generally stabilizes the system and tends to reduce degradation.
3) PCBM ∈ [0.00, 1.00] (weight fraction) — Fullerene acceptor. Physical meaning: Weight fraction of PCBM fullerene acceptor in the quaternary blend. Data trend: Strong interaction with olDTBR; degradation increases monotonically with min(PCBM, olDTBR); single-acceptor systems (PCBM dominant, olDTBR≈0) show low degradation (≈0.13 average); balanced PCBM-olDTBR mixing leads to degradation >0.4.
4) olDTBR ∈ [0.00, 1.00] (weight fraction) — Non-fullerene acceptor (oIDTBR). Physical meaning: Weight fraction of olDTBR non-fullerene acceptor in the quaternary blend. Data trend: Strong interaction with PCBM; degradation increases monotonically with min(PCBM, olDTBR); single-acceptor systems (olDTBR dominant, PCBM≈0) show low degradation; balanced PCBM-olDTBR mixing leads to degradation >0.4.

You receive:
1. Historical reference measurements (use only for calibration, never repeat them).
2. A list of candidate OPV blend compositions that require predictions.

Goal:
- For every candidate composition, output the predicted degradation value using the exact input order [PCE10, P3HT, PCBM, olDTBR].
- Ensure predictions are consistent with physical trade-offs observed in history.
- Valid performance range: degradation ∈ [0.0, 0.75]; lower is better.

Historical Data (read-only context):
{history_json}

Predict These Points (return predictions in the same order):
{points_json}

REQUIRED OUTPUT FORMAT (exact schema):
{{
    "data_points": [
        {{
            "features": [PCE10, P3HT, PCBM, olDTBR],
            "target": degradation
        }},
        {{
            "features": [PCE10, P3HT, PCBM, olDTBR],
            "target": degradation
        }}
    ]
}}
Note: Include one entry in "data_points" for each input point, maintaining the exact same order.

CRITICAL FORMATTING REQUIREMENTS:
1. Output ONLY the JSON object. No text before or after. No explanations. No markdown formatting.
2. Response must be valid JSON with double quotes, no comments, and no trailing commas.
3. The root object must contain exactly one key: "data_points" (an array).
4. The "data_points" array must contain exactly one entry for each input point, in the same order as provided.
5. Each entry must be an object with exactly two keys:
   - "features": an array of exactly 4 numbers [PCE10, P3HT, PCBM, olDTBR] in that exact order
   - "target": a single number (the predicted degradation value, rounded to 3 decimals, clipped to [0.0, 0.75])
6. Do not include explanations, markdown, historical records, or any other keys or text outside the JSON object.
7. The number of entries in "data_points" must exactly match the number of input points provided.

IMPORTANT: Start your response directly with {{ and end with }}. No preamble."""
    return system, user


# ========== Fullerene task ==========
def get_fullerene_warmup_prompt(n_points: int = 5) -> Tuple[str, str]:
    """Warmup prompt for Fullerene task (generate initial reaction conditions)."""
    system = SYSTEM_PROMPT

    user = f"""TASK = Fullerene C60 Cascadic Reaction Initial Point Generation

Background:
- This task studies a cascadic reaction forming o-xylenyl adducts of C60:
  C60 → X1 → X2 → X3 → ...
- First- and second-order adducts (X1, X2) are technologically useful.
- Higher-order adducts (X3 and above) are undesirable and should be suppressed.

Objective:
- Maximize the mole fraction of useful adducts (X1 + X2) by providing diverse, 
  BO-friendly initial reaction conditions that explore the design space.

Parameters (REAL values, NOT normalized; keep exact order):
1) reaction_time (min) ∈ [3, 31]
2) sultine_conc ∈ [1.5, 6.0]
3) temperature (°C) ∈ [100, 150]

Key physical priors (use as guidance):
- Increasing temperature, reaction time, or sultine concentration
  drives the reaction toward higher-order adducts (X3+).
- The strongest increase in X3 occurs when ALL THREE parameters
  are simultaneously high.
- Low temperature and low sultine concentration strongly suppress X3,
  even at moderate reaction times.
- Moderate parameter values tend to maximize useful adducts (X1 + X2).

Constraints:
- All parameters are continuous REAL values in physical units (do NOT normalize).
- Each parameter must be within its specified range.
- Generate exactly {n_points} points.
- Avoid duplicates and near-duplicates.

Design requirements:
- Ensure diversity across the reaction space.
- Include:
  * at least one low-severity point (low temperature, low sultine concentration)
  * at least one moderate point (balanced parameters)
  * at least one exploratory high-severity point
    (higher temperature and/or sultine concentration, but not all parameters maximal).

OUTPUT FORMAT:
{{
    "points": [
        {{"reaction_time": t1, "sultine_conc": s1, "temperature": T1}},
        {{"reaction_time": t2, "sultine_conc": s2, "temperature": T2}}
    ]
}}

CRITICAL: Output ONLY the JSON object above. No explanations, no markdown, no text before or after. Start directly with {{."""
    return system, user


def get_fullerene_prediction_prompt(history: List[Dict] = None,
                                    points: List[Dict] = None) -> Tuple[str, str]:
    """Prediction prompt for Fullerene task (returns template or filled prompt)."""
    system = SYSTEM_PROMPT

    feature_names = ["reaction_time", "sultine_conc", "temperature"]

    if history is not None and points is not None:
        history_json = format_history_json(history, feature_names)
        points_json = format_points_json(points, feature_names)
    else:
        history_json = "{history_json}"
        points_json = "{points_json}"

    user = """TASK = Predict Fullerene C60 Useful Adduct Mole Fraction

Background:
- Optimizing a cascadic reaction forming o-xylenyl adducts of C60 (C60 → X1 → X2 → X3 → ...) by tuning three key reaction parameters.
- The objective is to MAXIMIZE mole_fraction — the mole fraction of useful adducts (X1 + X2), directly influencing product selectivity and yield.
- Valid performance range: mole_fraction ∈ [0.0, 1.0]; higher is better.
- First- and second-order adducts (X1, X2) are technologically useful; higher-order adducts (X3+) are undesirable.
- All parameter values are in REAL, PHYSICAL UNITS (do NOT normalize, scale, or transform).
- Data-driven guidance from this dataset: mole_fraction exhibits strong nonlinear dependence on reaction conditions. High temperature, high sultine concentration, and long reaction time act synergistically to reduce mole_fraction. At low temperature, reactions remain effectively limited to low-order stages; even with moderate reaction time and sultine concentration, mole_fraction can remain high. The system does not follow single-parameter linear laws but is a cascadic reaction response surface determined jointly by temperature, reaction time, and reactant ratio.

Parameters (all REAL-valued in physical units, NOT normalized):
1) reaction_time ∈ [3, 31] (min) — Reaction duration. Physical meaning: Time allowed for the cascadic reaction to proceed. Data trend: At low temperature, useful adducts remain high even for moderate-to-long times; at high temperature, long reaction times (>~25 min) combined with high sultine concentration lead to severe cascading and low mole_fraction.
2) sultine_conc ∈ [1.5, 6.0] (dimensionless) — Sultine concentration. Physical meaning: Concentration of sultine reactant in the reaction mixture. Data trend: High concentration (6.0) combined with high temperature and long time drives cascading to higher-order adducts; moderate concentration (~4.2) at low temperature maintains high mole_fraction; stronger influence than reaction time.
3) temperature ∈ [100, 150] (°C) — Reaction temperature. Physical meaning: Temperature at which the cascadic reaction occurs. Data trend: Strongest influence on selectivity; low temperature tends to limit reaction to low-order stages and maintain higher mole_fraction, while high temperature combined with high sultine concentration and long time can drive cascading to higher-order adducts and reduce mole_fraction.

You receive:
1. Historical reference measurements (use only for calibration, never repeat them).
2. A list of candidate reaction conditions that require predictions.

Goal:
- For every candidate condition, output the predicted mole_fraction value using the exact input order [reaction_time, sultine_conc, temperature].
- Ensure predictions are consistent with physical trade-offs observed in history.
- Valid performance range: mole_fraction ∈ [0.0, 1.0]; higher is better.

Historical Data (read-only context):
{history_json}

Predict These Points (return predictions in the same order):
{points_json}

REQUIRED OUTPUT FORMAT (exact schema):
{{
    "data_points": [
        {{
            "features": [reaction_time, sultine_conc, temperature],
            "target": mole_fraction
        }},
        {{
            "features": [reaction_time, sultine_conc, temperature],
            "target": mole_fraction
        }}
    ]
}}
Note: Include one entry in "data_points" for each input point, maintaining the exact same order.

CRITICAL FORMATTING REQUIREMENTS:
1. Output ONLY the JSON object. No text before or after. No explanations. No markdown formatting.
2. Response must be valid JSON with double quotes, no comments, and no trailing commas.
3. The root object must contain exactly one key: "data_points" (an array).
4. The "data_points" array must contain exactly one entry for each input point, in the same order as provided.
5. Each entry must be an object with exactly two keys:
   - "features": an array of exactly 3 numbers [reaction_time, sultine_conc, temperature] in that exact order
   - "target": a single number (the predicted mole_fraction value, rounded to 3 decimals, clipped to [0.0, 1.0])
6. Do not include explanations, markdown, historical records, or any other keys or text outside the JSON object.
7. The number of entries in "data_points" must exactly match the number of input points provided.

IMPORTANT: Start your response directly with {{ and end with }}. No preamble."""
    return system, user


# ========== P3HT task ==========
def get_p3ht_warmup_prompt(n_points: int = 5) -> Tuple[str, str]:
    """Warmup prompt for P3HT/CNT task (generate initial formulation points)."""
    system = SYSTEM_PROMPT

    user = f"""TASK = P3HT/CNT Composite Initial Point Generation (Drop Casting)

Background:
- This task optimizes drop-cast P3HT/CNT composite thin films for electrical conductivity.
- The formulation consists of one polymer matrix (P3HT) and four types of carbon nanotubes (CNTs).
- Electrical conductivity arises from the formation of percolating CNT networks within the P3HT matrix.

Parameters (continuous, REAL-valued percentages; keep exact order as declared):
1) p3ht_content  — rr-P3HT polymer content ∈ [10, 100]
2) d1_content    — l-SWNT content ∈ [0, 60]
3) d2_content    — s-SWNT content ∈ [0, 70]
4) d6_content    — MWCNT content ∈ [0, 85]
5) d8_content    — DWCNT content ∈ [0, 75]

Objective:
- Maximize electrical conductivity by proposing diverse, BO-friendly initial compositions.

Key scientific priors (use as guidance, not as hard rules):
- Conductivity in polymer–CNT composites is strongly non-linear and often governed by
  percolation behavior of CNT networks.
- Different CNT types contribute differently to conductivity due to differences in
  aspect ratio, dispersion, and network connectivity.
- Excessively high total CNT loading may degrade conductivity due to aggregation,
  poor dispersion, or film discontinuities.
- Balanced or mixed CNT formulations can outperform single-CNT systems due to
  synergistic network formation.

Constraints:
- All parameters are continuous REAL values in percentage units (do NOT normalize).
- Hard constraint: p3ht_content + d1_content + d2_content + d6_content + d8_content = 100.0 exactly.
- Each parameter must be within its specified range.
- Generate exactly {n_points} points.
- Avoid duplicates and near-duplicates.

Design requirements:
- Ensure diversity across:
  * polymer-rich vs CNT-rich regimes
  * single-CNT-dominant vs mixed-CNT formulations
- Include:
  * at least one polymer-rich / low-CNT point (below percolation)
  * at least one mixed-CNT point (multiple d* non-zero)
  * at least one exploratory CNT-rich point (but avoid all CNTs simultaneously maximal)

OUTPUT FORMAT:
{{
  "points": [
    {{"p3ht_content": x1, "d1_content": x2, "d2_content": x3, "d6_content": x4, "d8_content": x5}},
    {{"p3ht_content": y1, "d1_content": y2, "d2_content": y3, "d6_content": y4, "d8_content": y5}}
  ]
}}

CRITICAL: Output ONLY the JSON object above.
No explanations, no markdown, no text before or after."""
    return system, user


def get_p3ht_prediction_prompt(history: List[Dict] = None,
                               points: List[Dict] = None) -> Tuple[str, str]:
    """Prediction prompt for P3HT/CNT task (returns template or filled prompt)."""
    system = SYSTEM_PROMPT

    feature_names = [
        "p3ht_content",
        "d1_content",
        "d2_content",
        "d6_content",
        "d8_content"
    ]

    if history is not None and points is not None:
        history_json = format_history_json(history, feature_names)
        points_json = format_points_json(points, feature_names)
    else:
        history_json = "{history_json}"
        points_json = "{points_json}"

    user = """TASK = Predict P3HT/CNT Composite Electrical Conductivity (Drop Casting)

Background:
- Optimizing drop-cast P3HT/CNT composite thin films for electrical conductivity by tuning five key compositional parameters.
- The objective is to MAXIMIZE electrical conductivity — a critical metric for electronic device performance, directly influencing charge transport efficiency and device functionality.
- All parameter values are in REAL, PHYSICAL UNITS (do NOT normalize, scale, or transform).
- Data-driven guidance from this dataset: conductivity exhibits strong nonlinear dependence on composition; balanced polymer/CNT loading with sufficient l-SWNT content and limited amounts of other CNT types generally leads to higher conductivity, while excessive polymer or excessive total CNT loading can degrade performance.

Parameters (all REAL-valued in physical units, NOT normalized):
1) p3ht_content ∈ [10, 100] (%) — rr-P3HT polymer content. Physical meaning: The mass percentage of regioregular poly(3-hexylthiophene) polymer matrix forming the composite film. Data trend: Moderate values (40–50%) are optimal; excessive content (>~60%) suppresses CNT connectivity and reduces conductivity.
2) d1_content ∈ [0, 60] (%) — l-SWNT carbon nanotube content. Physical meaning: The mass percentage of long single-walled carbon nanotubes (l-SWNT) in the composite. Data trend: Strong positive association with conductivity when in the 50–60% range; insufficient content (<~40%) leads to low conductivity.
3) d2_content ∈ [0, 70] (%) — s-SWNT carbon nanotube content. Physical meaning: The mass percentage of short single-walled carbon nanotubes (s-SWNT) in the composite. Data trend: Large fractions can reduce conductivity; small fractions are often preferable.
4) d6_content ∈ [0, 85] (%) — MWCNT carbon nanotube content. Physical meaning: The mass percentage of multi-walled carbon nanotubes (MWCNT) in the composite. Data trend: Large fractions can reduce conductivity; moderate or low fractions are often preferable.
5) d8_content ∈ [0, 75] (%) — DWCNT carbon nanotube content. Physical meaning: The mass percentage of double-walled carbon nanotubes (DWCNT) in the composite. Data trend: Plays a secondary role relative to l-SWNT, with smaller fractions generally more favorable for high conductivity.

You receive:
1. Historical reference measurements (use only for calibration, never repeat them).
2. A list of candidate P3HT/CNT compositions that require predictions.

Goal:
- For every candidate composition, output the predicted conductivity value using the exact input order [p3ht_content, d1_content, d2_content, d6_content, d8_content].
- Ensure predictions are consistent with physical trade-offs observed in history.
- Valid performance range: conductivity ∈ [0.0, 1250.0] (S/cm); higher is better.

Historical Data (read-only context):
{history_json}

Predict These Points (return predictions in the same order):
{points_json}

REQUIRED OUTPUT FORMAT (exact schema):
{{
    "data_points": [
        {{
            "features": [p3ht_content, d1_content, d2_content, d6_content, d8_content],
            "target": conductivity
        }},
        {{
            "features": [p3ht_content, d1_content, d2_content, d6_content, d8_content],
            "target": conductivity
        }}
    ]
}}
Note: Include one entry in "data_points" for each input point, maintaining the exact same order.

CRITICAL FORMATTING REQUIREMENTS:
1. Output ONLY the JSON object. No text before or after. No explanations. No markdown formatting.
2. Response must be valid JSON with double quotes, no comments, and no trailing commas.
3. The root object must contain exactly one key: "data_points" (an array).
4. The "data_points" array must contain exactly one entry for each input point, in the same order as provided.
5. Each entry must be an object with exactly two keys:
   - "features": an array of exactly 5 numbers [p3ht_content, d1_content, d2_content, d6_content, d8_content] in that exact order
   - "target": a single number (the predicted conductivity value, rounded to 3 decimals, clipped to [0.0, 1250.0])
6. Do not include explanations, markdown, historical records, or any other keys or text outside the JSON object.
7. The number of entries in "data_points" must exactly match the number of input points provided.

IMPORTANT: Start your response directly with {{ and end with }}. No preamble."""
    return system, user


# ========== Helper functions ==========
def _round_if_needed(value: float, decimals: int = 2) -> float:
    """Round a float to a given number of decimals only when needed."""
    str_value = f"{value:.10f}".rstrip('0').rstrip('.')
    if '.' in str_value:
        current_decimals = len(str_value.split('.')[1])
        if current_decimals <= decimals:
            return value
    return round(float(value), decimals)


def _extract_features(point: dict, feature_names: List[str] = None) -> List[float]:
    """Extract feature values from a point dictionary."""
    import numpy as np
    
    if feature_names:
        raw_values = [float(point.get(name, 0)) for name in feature_names]
    else:
        # Extract values from dict and cast to native Python numeric types
        raw_values = [int(v) if isinstance(v, (np.integer, np.int64, np.int32)) else float(v) 
                     for v in point.values()]
    
    # Round to at most 3 decimal places
    return [_round_if_needed(v, 3) for v in raw_values]


def format_history_json(history: List[Dict], feature_names: List[str] = None) -> str:
    """Format history data as a JSON string."""
    if not history:
        return '{"data_points": []}'
    
    import numpy as np
    
    data_points = []
    for point in history:
        x = point.get("x", {})
        y = point.get("y", 0.0)
        
        features = _extract_features(x, feature_names)
        
        data_points.append({
            "features": features,
            "target": round(float(y), 3)
        })
    
    return json.dumps({"data_points": data_points}, separators=(',', ' '))


def format_points_json(points: List[Dict], feature_names: List[str] = None) -> str:
    """Format candidate points as a JSON string."""
    data_points = []
    for point in points:
        features = _extract_features(point, feature_names)
        data_points.append({"features": features})
    
    return json.dumps({"data_points": data_points}, separators=(',', ' '))


# ========== Task registry ==========
TASK_PROMPTS = {
    "FeCr": {
        "warmup": get_fecr_warmup_prompt,
        "prediction": get_fecr_prediction_prompt
    },
    "COF": {
        "warmup": get_cof_warmup_prompt,
        "prediction": get_cof_prediction_prompt
    },
    "Sandwich": {
        "warmup": get_sandwich_warmup_prompt,
        "prediction": get_sandwich_prediction_prompt
    },
    "Fullerene": {
        "warmup": get_fullerene_warmup_prompt,
        "prediction": get_fullerene_prediction_prompt
    },
    "P3HT": {
        "warmup": get_p3ht_warmup_prompt,
        "prediction": get_p3ht_prediction_prompt
    },
    "PCE10": {
        "warmup": get_pce10_warmup_prompt,
        "prediction": get_pce10_prediction_prompt
    },
    # Additional tasks can be added here if needed
}


def get_warmup_prompt(task_name: str, n_points: int = 5) -> Tuple[str, str]:
    """Return warmup prompt for a given task."""
    if task_name not in TASK_PROMPTS:
        raise ValueError(f"Unknown task: {task_name}. Available: {list(TASK_PROMPTS.keys())}")
    
    func = TASK_PROMPTS[task_name]["warmup"]
    return func(n_points)


def load_prompts(task_name: str) -> Tuple[str, List[str]]:
    """Load prompts for a given task (global system prompt + user prompt variants)."""
    system = SYSTEM_PROMPT
    
    if task_name not in TASK_PROMPTS:
        raise KeyError(f"Unknown task: {task_name}. Available: {list(TASK_PROMPTS.keys())}")
    
    # Get prediction prompt function
    prediction_func = TASK_PROMPTS[task_name]["prediction"]
    
    # Generate user prompt variants using the template (no data yet)
    _, user_template = prediction_func(history=None, points=None)
    
    # Return a single template; callers may build variants by changing history subsets
    user_prompts = [user_template]
    
    return system, user_prompts


def get_prediction_prompt(task_name: str, history: List[Dict], points: List[Dict]) -> Tuple[str, str]:
    """Return prediction prompt for a given task, filled with history and points."""
    if task_name not in TASK_PROMPTS:
        raise ValueError(f"Unknown task: {task_name}. Available: {list(TASK_PROMPTS.keys())}")
    
    func = TASK_PROMPTS[task_name]["prediction"]
    return func(history, points)

