import json
import re
import random
import math

def extract_variables(prompt: str):
    """提取 prompt 中出现的单字母变量（包括 θ）"""
    vars = set(re.findall(r"\b([b-zB-Z])\b", prompt))
    if "θ" in prompt:
        vars.add("θ")
    return sorted(vars)

def split_pi(expr: str):
    """
    检查表达式是否含有 π。
    如果是，返回 (True, expr_without_pi)；否则 (False, expr)。
    """
    expr = expr.split("=", 1)[-1].strip()
    expr = expr.rstrip(".")
    expr = expr.replace("^", "**")

    if "π" in expr:
        expr_no_pi = expr.replace("π", "1", 1)
        return True, expr_no_pi
    else:
        return False, expr

def generate_instance(item, total_instances=4, value_range=(1, 15)):
    # ---- 获取量名 ----
    match = re.search(r"Its (.*?) can be calculated by the formula:", item["Formula"]["prompt"])
    if match:
        quantity = match.group(1).strip()
    else:
        quantity = item["Formula"]["target_new"].split("=")[0].strip()

    # ---- 构建模板 prompt ----
    base_prompt = re.sub(r"Its .*? can be calculated by the formula:", "", item["Formula"]["prompt"]).strip()
    template_prompt = re.sub(r"\b([b-zB-Z])\b", r"{\1}", base_prompt)
    template_prompt = template_prompt.replace("θ", r"{θ}")
    template_prompt = f"{template_prompt} What is its {quantity}? The answer is"

    # ---- 解析公式 ----
    has_pi, expr = split_pi(item["Formula"]["target_new"])
    variables = extract_variables(item["Formula"]["prompt"])

    instance_prompts = []
    instance_truths = []
    rephrase_prompts = []
    # 一半用模板问答（只答案），一半用原始prompt（计算过程+答案）
    for idx in range(total_instances):
        vals = {}

        for var in variables:
            if var == "θ":
                rad_val = random.randint(1, 6)  # θ 直接用弧度制，范围 [1,6]
                vals["θ"] = rad_val
            else:
                v = random.randint(*value_range)
                vals[var] = v

        try:
            result = eval(expr, {"math": math}, vals)
            if has_pi:
                result_str = f"{result}π"
            else:
                result_str = str(result)
        except Exception as e:
            result_str = f"Error: {e}"

        # if idx < total_instances // 2:
        #     # ---- 模板形式，只回答答案 ----
        #     instance_prompt = template_prompt.format(**vals)
        #     gt_entry = result_str
        # else:
        # ---- 原始公式形式，回答过程 + 答案 ----
        instance_prompt = item["Formula"]["prompt"]
        instance_rephrase_prompt = item["Formula"]["rephrase_prompt"]
        for var, val in vals.items():
            instance_prompt = re.sub(rf"\b{var}\b", str(val), instance_prompt)
            instance_rephrase_prompt = re.sub(rf"\b{var}\b", str(val), instance_rephrase_prompt)

        target_var = item["Formula"]["target_new"].split("=", 1)[0].strip()
        base_formula = item["Formula"]["target_new"].split("=", 1)[-1].strip().rstrip(".")
        base_formula = base_formula.replace("^", "**")
        gt_process = base_formula
        for var, val in vals.items():
            gt_process = re.sub(rf"\b{var}\b", str(val), gt_process)
        gt_process = gt_process.replace("**", "^")

        if "Error" not in result_str:
            if has_pi:
                gt_entry = f"{target_var} = {gt_process} = {result}π"
            else:
                gt_entry = f"{target_var} = {gt_process} = {result}"
        else:
            gt_entry = result_str

        instance_prompts.append(instance_prompt)
        instance_truths.append(gt_entry)
        rephrase_prompts.append(instance_rephrase_prompt)

    return {
        "prompt": instance_prompts,
        "target_new": instance_truths,
        "rephrase_prompt": rephrase_prompts
    }

def add_portability(input_file: str, output_file: str):
    with open(input_file, "r", encoding="utf-8") as f:
        data = json.load(f)

    for item in data:
        item["Instance"] = generate_instance(item)

    with open(output_file, "w", encoding="utf-8") as f:
        json.dump(data, f, ensure_ascii=False, indent=4)

    print(f"处理完成，结果保存到 {output_file}")


# 使用示例
add_portability("math_rule.json", "math_rule_instance.json")
