import json

root_path = "/finance_ML/wuxiaojun/RAG/RAG-Factory/results/"
# path = /finance_ML/wuxiaojun/RAG/RAG-Factory/results/agriculture/graph_rag/agriculture_100_multi_v2_eval_requests.jsonl
path = root_path + "/cs/graph_rag/" + "cs_100_multistep_eval_requests.jsonl"
path = root_path + "/cs/graph_rag/" + "cs_100_tog3_eval_requests.jsonl"
# path = root_path + "/agriculture/graph_rag/" + "agriculture_100_multi_v2_eval_requests.jsonl"

with open(path, "r") as f:
    data = json.load(f)

data = data["responses"]

new_data = []
for item in data:
    item = item.replace("\n", "")
    item = item.strip("```json")
    item = item.strip("```")
    try:
        dict_item = json.loads(item)
        new_data.append(dict_item)
        # print(dict_item)
        # print("===")
    except json.JSONDecodeError:
        print("Failed to parse JSON:", item)
        continue

print(f"Parsed {len(new_data)} out of {len(data)} items.")

final_data = []
for item in new_data:
    new_item = {}
    for key, value in item.items():
        new_item[key] = value["Winner"]
    final_data.append(new_item)



with open(root_path +  "cs_100_multistep_eval_requests_new.jsonl", "w") as f:
    for item in new_data:
        f.write(json.dumps(item) + "\n")
with open(root_path + "cs_100_multistep_eval_requests_final.jsonl", "w") as f:
    for item in final_data:
        f.write(json.dumps(item) + "\n")

# count the number of each method being chosen as winner
method_count = {}
metrics = ["Comprehensiveness","Diversity", "Empowerment","Overall Winner"]
method_count = {metric : {} for metric in metrics}
for item in final_data:
    for metric in metrics:
        try:
            method = item[metric]
            if method not in method_count[metric]:
                method_count[metric][method] = 0
            method_count[metric][method] += 1
        except KeyError:
            pass
print("Method count:", method_count)

save_path = root_path + "broad_reasoning_metrics.json"
save_metrics = {}
for metric in metrics:
    # print(f"Metric: {metric}")
    total = sum(method_count[metric].values())
    for method, count in method_count[metric].items():
        percentage = count / total * 100
        # print(f"  {method}: {count} ({percentage:.2f}%)")
        save_metrics[metric] = save_metrics.get(metric, {})
        save_metrics[metric][method] = percentage


print(save_metrics)
with open(save_path, "w") as f:
    json.dump(save_metrics, f, indent=4)
