#!/usr/bin/env python3
import sys, os
sys.path.insert(0, os.path.abspath(os.path.join(os.path.dirname(__file__), '..')))
from mock_ges import generate_mock_synthesis_output
import json

# Query ids for which mock evidence scores are generated.
QUERY_IDS = ("Q001", "Q002", "Q003")


def load_corpus(path):
    """Read a JSON Lines corpus file into a list of document dicts.

    Each non-blank line must be a JSON object with "_id", "title" and
    "text" keys. The title and text are joined with a single space.

    Args:
        path: Location of the JSONL file.

    Returns:
        A list of ``{"docid": ..., "text": ...}`` dicts in file order.

    Raises:
        OSError: If the file cannot be opened.
        json.JSONDecodeError: If a non-blank line is not valid JSON.
        KeyError: If a record lacks one of the required keys.
    """
    docs = []
    # Explicit UTF-8 so decoding does not depend on the platform locale.
    with open(path, 'r', encoding='utf-8') as f:
        for line in f:
            # Tolerate blank lines (e.g. a trailing newline at end of file),
            # which json.loads would otherwise reject.
            if not line.strip():
                continue
            doc = json.loads(line)
            docs.append({"docid": doc["_id"], "text": doc["title"] + " " + doc["text"]})
    return docs


def write_trec_run(evidence_results, path):
    """Write per-query scores to a TREC-style run file.

    Output lines have the form ``qid Q0 docid rank score mock_ges``. Within
    each query, documents are ordered by descending score and ranked from 1.
    Only documents with a score strictly greater than zero are written.

    Args:
        evidence_results: Mapping of query id to a mapping of docid to
            numeric score.
        path: Location of the run file to create or overwrite.
    """
    with open(path, 'w', encoding='utf-8') as f:
        for qid, scores in evidence_results.items():
            # Filter before ranking so ranks are contiguous by construction;
            # this also drops NaN scores, which would make the sort order
            # unreliable.
            with_evidence = [(docid, score) for docid, score in scores.items() if score > 0]
            # sorted() is stable, so ties keep the mapping's iteration order.
            with_evidence.sort(key=lambda pair: pair[1], reverse=True)
            f.writelines(
                f"{qid} Q0 {docid} {rank} {score:.6f} mock_ges\n"
                for rank, (docid, score) in enumerate(with_evidence, 1)
            )


def main():
    """Generate mock evidence scores for QUERY_IDS and save them as a run file.

    Reads ``corpus.jsonl`` and writes ``multi_ges.trec``, both relative to
    the current working directory.
    """
    # Load documents
    docs = load_corpus('corpus.jsonl')

    # Generate evidence for each query.
    # NOTE(review): assumes result["multi_ges_scores"] is a docid -> score
    # mapping, as the run-file writer iterates it with .items() - confirm
    # against mock_ges.
    evidence_results = {}
    for qid in QUERY_IDS:
        result = generate_mock_synthesis_output(qid, docs, seed=42)
        evidence_results[qid] = result["multi_ges_scores"]

    # Convert to TREC format
    write_trec_run(evidence_results, 'multi_ges.trec')

    print("Mock evidence scores generated")


if __name__ == "__main__":
    main()