import argparse
import json
import multiprocessing
import os
import re
import sys
import time
from concurrent.futures import ThreadPoolExecutor, as_completed
from pathlib import Path

from tqdm import tqdm

sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
from utils import (
    llm_generation,
)

# ----------------------------- #
# Prompt (already adapted by the user)
# ----------------------------- #

backend_test_prompt = """You are an expert in understanding website generation instructions. You will be given a website generation instruction, as well as a list of GUI test cases and expected results. Your task is to generate a list of backend test cases. Each backend test case should include an instruction regarding what to test, as well as the expected result of that test.

Requirements:
- A backend test case should contain an instruction and an expected result.
- The instruction should describe a specific functionality or feature of the backend that needs to be tested.
- The expected result should describe the expected outcome of the test.
- You should NEVER specify any names, paths, data, or other implementation details in the test cases. Instead, only describe what to test and the expected outcome.
- You should ONLY consider the backend functionalities that are absolutely necessary to fulfill the requirements of the website generation instruction and the GUI test cases. If a functionality is not necessary, do not include it in your output.
- Some of the requirements in the GUI test cases may not be relevant to backend testing. They might be achievable by the frontend alone. You should ignore those requirements and only focus on the backend functionalities.

Example:

Instruction: Create a blogging platform where users can register, create profiles, write blog posts, and comment on posts.

GUI Test Cases:
Instruction: Register a new user with valid details.
Expected Result: User is registered successfully and can log in.

Instruction: Create a new blog post.
Expected Result: Blog post is created and visible on the user's profile.

Instruction: Comment on a blog post.
Expected Result: Comment is added and visible under the blog post.

Instruction: Edit user profile information.
Expected Result: Profile information is updated successfully.

Thinking Process:
[several lines of reasoning about what backend functionalities are needed]

Output the backend test cases in JSON format as shown in the example below:
```json
{{
    "backend_test_cases": [
        {{
            "instruction": "Test the user registration API endpoint by sending a request with valid user information.",
            "expected_result": "Return a success response indicating the user is registered."
        }},
        {{
            "instruction": "Test the blog post creation API endpoint by sending a request with valid blog post data.",
            "expected_result": "Return a success response indicating the blog post is created."
        }},
        {{
            "instruction": "Test the blog post commenting API endpoint by sending a request with valid comment data.",
            "expected_result": "Return a success response indicating the comment is added."
        }},
        {{
            "instruction": "Test user profile update API endpoint by sending a request with updated profile information.",
            "expected_result": "Return a success response indicating the profile is updated."
        }}
    ]
}}
```

Now, based on the above requirements and example, please generate the list of data structures for the following instruction:

Instruction: {instruction}"""

# ----------------------------- #
# Helpers for JSONL I/O
# ----------------------------- #
def load_json(path):
    with open(path, "r", encoding="utf-8") as f:
        return json.load(f)

def dump_json(obj, path):
    Path(path).parent.mkdir(parents=True, exist_ok=True)
    with open(path, "w", encoding="utf-8") as f:
        json.dump(obj, f, ensure_ascii=False, indent=2)

def load_jsonl(path: str):
    """Return a list with one dict per line in the JSONL file."""
    with open(path, "r", encoding="utf-8") as f:
        return [json.loads(line) for line in f]

def dump_jsonl(objs, path: str):
    """Write a list of dicts to a JSONL file."""
    with open(path, "w", encoding="utf-8") as f:
        for obj in objs:
            f.write(json.dumps(obj, ensure_ascii=False) + "\n")

# ----------------------------- #
# Parsing the model output
# ----------------------------- #
_JSON_BLOCK_RE = re.compile(r"```json(.*?)```", re.S)


def extract_backend_tests(raw_text: str):
    """
    Extract the list of backend test-case dicts from the model's raw response.
    Returns [] if nothing could be parsed.
    """
    # 1) Prefer the fenced ```json … ``` block
    match = _JSON_BLOCK_RE.search(raw_text)
    json_src = match.group(1).strip() if match else raw_text

    # Try to parse as JSON
    try:
        parsed = json.loads(json_src)
        tests = parsed.get("backend_test_cases", [])
        if isinstance(tests, list):
            return tests
    except json.JSONDecodeError:
        pass

    # 2) Fallback: try to locate the first { … } block anywhere
    try:
        parsed = json.loads(re.search(r"\{.*\}", raw_text, re.S).group())
        return parsed.get("backend_test_cases", [])
    except Exception:
        return []  # give up

# ----------------------------- #
# Core generation wrapper
# ----------------------------- #
def generate_backend_tests(instruction: str):
    """
    Ask the LLM to create backend test cases for one instruction and return
    them as a list of dicts.
    """
    prompt = backend_test_prompt.format(instruction=instruction)
    messages = [{"role": "user", "content": prompt}]

    response = llm_generation(
        messages,
        model="Qwen3-Coder-480B-A35B-Instruct-FP8",  # adjust if needed
    )
    raw_content = response.get("content", "")
    return extract_backend_tests(raw_content)

# ----------------------------- #
# Per-sample worker
# ----------------------------- #
def process_sample(sample):
    """
    Generate backend tests for a single dataset entry.
    Returns the augmented sample dict.
    """
    inst = sample.get("instruction", "")
    tests = generate_backend_tests(inst)
    sample["backend_test_cases"] = tests
    return sample

# ----------------------------- #
# Main routine
# ----------------------------- #
def run_generation(input_path: str, output_path: str, max_workers: int | None = None):
    items = load_json(input_path)

    results = []
    max_workers = max_workers or min(32, multiprocessing.cpu_count() * 2)

    with ThreadPoolExecutor(max_workers=max_workers) as executor:
        futures = {executor.submit(process_sample, itm): idx for idx, itm in enumerate(items)}
        for fut in tqdm(as_completed(futures), total=len(items), desc="Generating backend tests"):
            idx = futures[fut]
            try:
                results.append(fut.result())
            except Exception as e:
                faulty = items[idx]
                faulty["backend_test_cases"] = []
                results.append(faulty)
                print(f"[WARN] Generation failed for id={faulty.get('id')}: {e}")

    # Preserve original ordering
    results.sort(key=lambda d: d.get("id", idx))

    Path(output_path).parent.mkdir(parents=True, exist_ok=True)
    dump_json(results, output_path)
    print(f"Saved {len(results)} items to {output_path}")

# ----------------------------- #
# CLI entry-point
# ----------------------------- #
def main():
    parser = argparse.ArgumentParser(description="Generate backend tests for WebGen-Bench")
    parser.add_argument(
        "-i", "--input",
        default="src/generate_fullstack_tests/WebGen-Bench_test-db.json",
        help="Path to input JSONL file"
    )
    parser.add_argument(
        "-o", "--output",
        default="src/generate_fullstack_tests/test_backend_model-gen.jsonl",
        help="Path to output JSONL file"
    )
    parser.add_argument(
        "-w", "--workers",
        type=int,
        default=8,
        help="Number of parallel threads (default: 2×CPU cores, max 32)"
    )
    args = parser.parse_args()
    t0 = time.time()
    run_generation(args.input, args.output, args.workers)
    print(f"Finished in {time.time() - t0:.1f}s")

# ----------------------------- #
if __name__ == "__main__":
    main()