#!/usr/bin/env python3
"""
Reviewer-driven rewrite of paper sections with score-based gating.
All paths are anonymised via ANON_PROJECT_ROOT.
"""

import re
import json
import shutil
import argparse
import pandas as pd
from create_util import *
from create_cite import *

# ---------- Arg ----------
parser = argparse.ArgumentParser(description="Rewrite paper sections based on review score")
parser.add_argument("--original_csv_path", required=True, help="CSV with paper scores.")
parser.add_argument("--topic", required=True, help="Topic folder name.")
parser.add_argument("--topic_description", required=True, help="Sub-topic folder name.")
parser.add_argument("--model_name", default="deepseek-v3", help="LLM for rewriting.")
parser.add_argument("--revision_name", required=True, help="Revision folder suffix.")
parser.add_argument("--old_path_name", required=True, help="Previous revision to copy.")
parser.add_argument("--model_used_for_review", default="iclr2025_conference", help="Folder containing review JSON.")
parser.add_argument("--mode", default="normal", choices=["normal", "force"], help="Gate on score or always run.")
args = parser.parse_args()

original_csv_path   = args.original_csv_path
folder_name         = args.topic
topic_description   = args.topic_description
model_name          = args.model_name
revision_name       = args.revision_name
old_path_name       = args.old_path_name
model_used_for_review = args.model_used_for_review
mode                = args.mode

# ---------- Score Gate ----------
df = pd.read_csv(original_csv_path)
score_col = f"{old_path_name}_score" if old_path_name != "latex" else "llm_paper_score"
if mode == "normal":
    score = df.loc[df["topic_description"] == topic_description, score_col].iloc[0]
    if pd.isna(score) or score >= 6:
        print(f"{score_col} = {score} ≥ 6, exiting.")
        exit()
    print(f"{score_col} = {score} < 6, proceeding with rewrite.")

# ---------- Anonymous Base ----------
BASE_DIR   = os.environ.get("ANON_PROJECT_ROOT", "./anonymous_root")
old_path   = os.path.join(BASE_DIR, folder_name, topic_description, old_path_name)
new_path   = os.path.join(BASE_DIR, folder_name, topic_description, revision_name)
bib_file   = os.path.join(new_path, "iclr2025_conference.bib")

# ---------- Copy Previous Revision ----------
if not os.path.exists(new_path):
    shutil.copytree(old_path, new_path)

# ---------- Load Review ----------
review_json = os.path.join(
    BASE_DIR, folder_name, topic_description,
    old_path_name if old_path_name != "latex" else model_used_for_review,
    "iclr2025_conference", "iclr2025_conference.json"
)
with open(review_json, "r", encoding="utf-8") as f:
    review_data = json.load(f)

reviewer_comments = [
    msg["content"].lstrip()
    for msg in review_data["messages"]
    if msg.get("agent_name") != "Author"
]

# ---------- Section Guidance ----------
SECTION_PROMPTS = {
    "abstract.tex": """
TL;DR of the paper.
What are we trying to do and why is it relevant?
Why is this hard?
How do we solve it (i.e., our contribution)?
How do we verify that we solved it (experiments and results)?
One smooth paragraph, wrapped in \\begin{abstract}...\\end{abstract}.
Output only LaTeX inside ```latex```.
""",
    "introduction.tex": """
Longer version of the abstract.
Motivation, difficulty, contribution, validation.
List contributions explicitly if desired.
Paragraphs, not lists.
Correct citations: \\cite{}, \\citet{}, \\citep{}; no bare "et al.".
Output only LaTeX inside ```latex```.
""",
    "background.tex": """
Academic ancestors: concepts and prior work required for our method.
Incorporate formal notation where helpful.
Paragraph format, no lists.
Correct citations.
Output only LaTeX inside ```latex```.
""",
    "methodology.tex": """
What we do and why, using the formalism of the Background.
Include variables/formulas as needed.
Paragraph format, no lists.
Correct citations.
Output only LaTeX inside ```latex```.
""",
    "experiments_setting.tex": """
Datasets, baselines, metrics, implementation details.
Paragraph format preferred.
Cite open-source models/datasets; link closed-source ones.
Correct citations.
Output only LaTeX inside ```latex```.
""",
    "results.tex": """
Analyse every provided table in detail.
Do not alter table content.
Paragraph format, no lists.
Correct citations.
Output only LaTeX inside ```latex```.
""",
    "related_work.tex": """
Academic siblings: compare & contrast alternative approaches.
2–4 paragraphs, each led by a bold category summary.
Correct citations.
Output only LaTeX inside ```latex```.
""",
}

FILES = list(SECTION_PROMPTS.keys())

# ---------- Full-paper Context ----------
paper_all = ""
for file in FILES:
    sec_path = os.path.join(new_path, "content", file)
    if os.path.exists(sec_path):
        with open(sec_path, "r", encoding="utf-8") as f:
            paper_all += f.read() + "\n\n"

# ---------- Rewrite Each Section ----------
for file in FILES:
    sec_path = os.path.join(new_path, "content", file)
    if not os.path.exists(sec_path):
        continue

    with open(sec_path, "r", encoding="utf-8") as f:
        paper_now = f.read()

    prompt = f"""
1. Revise the section according to reviewer suggestions.
2. Keep style consistent with the previous version.
3. Follow these writing tips:

{SECTION_PROMPTS[file]}

4. Output only LaTeX inside ```latex```.

###### Section {file} to Revise BEGIN ######
{paper_now}
###### Section {file} to Revise END ######

###### Full Paper Context BEGIN ######
{paper_all}
###### Full Paper Context END ######

###### Reviewer Comments BEGIN ######
{reviewer_comments}
###### Reviewer Comments END ######
"""

    model = ChatAgent(model_name)
    llm_out = model.chat({"role": "user", "content": prompt})

    latex_match = re.search(r"```latex\n(.*?)\n```", llm_out, re.DOTALL)
    revised = latex_match.group(1) if latex_match else llm_out

    get_cite(revised, bib_file)
    delete_cite(revised, sec_path)

    with open(sec_path, "w", encoding="utf-8") as f:
        f.write(revised)

# ---------- Re-compile PDF ----------
from create_pdf_revision import create_pdf
create_pdf(folder_name, topic_description, revision_name)