#!/usr/bin/env python3
"""
Rewrite individual paper sections according to reviewer comments.
All paths are anonymized via ANON_PROJECT_ROOT.
"""

import re
import json
import shutil
import argparse
from create_util import *
from create_cite import *

# ---------- Arg Parsing ----------
parser = argparse.ArgumentParser(description="Reviewer-driven section rewrite")
parser.add_argument("--topics", required=True, help="Topic folder name.")
parser.add_argument("--topic_description", required=True, help="Sub-topic folder name.")
parser.add_argument("--model_name", default="deepseek-v3", help="Model for rewriting.")
parser.add_argument("--revision_name", required=True, help="Revision folder suffix.")
parser.add_argument("--model_used_for_review", required=True, help="Model that produced review JSON.")
args = parser.parse_args()

folder_name = args.topics
topic_description = args.topic_description
model_name = args.model_name
revision_name = args.revision_name
model_used_for_review = args.model_used_for_review

# ---------- Anonymous Base Directory ----------
BASE_DIR = os.environ.get("ANON_PROJECT_ROOT", "./anonymous_root")
WORK_DIR = os.path.join(BASE_DIR, folder_name, topic_description)
REVISION_DIR = os.path.join(WORK_DIR, revision_name)
BIB_FILE = os.path.join(REVISION_DIR, "iclr2025_conference.bib")

# ---------- Copy Clean LaTeX Tree ----------
shutil.copytree(os.path.join(WORK_DIR, "latex"), REVISION_DIR, dirs_exist_ok=True)

# ---------- Load Review Comments ----------
REVIEW_JSON = os.path.join(WORK_DIR, model_used_for_review, "iclr2025_conference", "iclr2025_conference.json")
with open(REVIEW_JSON, "r", encoding="utf-8") as f:
    review_data = json.load(f)

# keep only reviewer messages (skip author)
reviewer_comments = [
    msg["content"].lstrip()
    for msg in review_data["messages"]
    if msg.get("agent_name") != "Author"
]

# ---------- Section-wise Prompts ----------
SECTION_PROMPTS = {
    "abstract.tex": """
TL;DR of the paper.
What are we trying to do and why is it relevant?
Why is this hard?
How do we solve it (i.e., our contribution)?
How do we verify that we solved it (experiments and results)?
Produce a single smooth, well-motivated paragraph.
Wrap with \\begin{abstract}...\\end{abstract}.
Output only LaTeX inside ```latex```.
""",
    "introduction.tex": """
Longer version of the abstract.
Motivation, difficulty, contribution, validation.
List contributions explicitly if possible.
Use paragraphs, not lists.
Correct citations: \\cite{}, \\citet{}, \\citep{}; no bare "et al.".
Wrap LaTeX in ```latex```.
""",
    "background.tex": """
Academic ancestors: concepts and prior work required to understand our method.
Incorporate formal notation where helpful.
Paragraph format, no lists.
Correct citation commands.
Wrap LaTeX in ```latex```.
""",
    "methodology.tex": """
Describe what we do and why, using formalism from Background.
Include variables/formulas as needed.
Paragraph format, no lists.
Correct citations.
Wrap LaTeX in ```latex```.
""",
    "experiments_setting.tex": """
Describe datasets, baselines, metrics, implementation details.
Paragraph format preferred.
Cite open-source models and datasets; link closed-source ones.
Correct citation commands.
Wrap LaTeX in ```latex```.
""",
    "results.tex": """
Analyse every provided table in detail.
Do not alter table content.
Paragraph format, no lists.
Correct citations.
Wrap LaTeX in ```latex```.
""",
    "related_work.tex": """
Academic siblings: compare and contrast alternative approaches.
2–4 paragraphs, each led by a bold category summary.
Correct citations.
Wrap LaTeX in ```latex```.
""",
}

FILES_TO_REWRITE = [
    "abstract.tex", "introduction.tex", "background.tex",
    "methodology.tex", "experiments_setting.tex", "results.tex",
    "related_work.tex",
]

# ---------- Load Full Paper for Context ----------
full_paper = ""
for sec in FILES_TO_REWRITE:
    sec_path = os.path.join(REVISION_DIR, "content", sec)
    if os.path.exists(sec_path):
        with open(sec_path, "r", encoding="utf-8") as f:
            full_paper += f"%% ------ {sec} ------ %%\n" + f.read() + "\n\n"

# ---------- Rewrite Each Section ----------
for sec in FILES_TO_REWRITE:
    sec_path = os.path.join(REVISION_DIR, "content", sec)
    if not os.path.exists(sec_path):
        continue

    with open(sec_path, "r", encoding="utf-8") as f:
        original = f.read()

    prompt = f"""
1. Revise the specified section according to the reviewer suggestions.
2. Keep style consistent with the original.
3. Follow these writing tips:

{SECTION_PROMPTS[sec]}

4. Output only LaTeX inside ```latex```.

###### Section to Revise BEGIN ######
{original}
###### Section to Revise END ######

###### Full Paper for Reference BEGIN ######
{full_paper}
###### Full Paper for Reference END ######

###### Reviewer Comments BEGIN ######
{reviewer_comments}
###### Reviewer Comments END ######
"""

    model = ChatAgent(model_name)
    llm_output = model.chat({"role": "user", "content": prompt})

    # extract latex
    latex_match = re.search(r"```latex\n(.*?)\n```", llm_output, re.DOTALL)
    revised = latex_match.group(1) if latex_match else llm_output

    # sanitize citations
    get_cite(revised, BIB_FILE)
    delete_cite(revised, sec_path)

    with open(sec_path, "w", encoding="utf-8") as f:
        f.write(revised)

    logger.info(f"Rewritten {sec}")

# ---------- Re-compile PDF ----------
from create_pdf_revision import create_pdf
create_pdf(folder_name, topic_description, revision_name)