# All code is original unless otherwise noted.

import sys
import os
import argparse

# Parse command-line arguments
parser = argparse.ArgumentParser()
parser.add_argument('--path', type=str, required=True, help='Project root path')
parser.add_argument('--gpu', type=str, default='0', help='GPU device ID (CUDA_VISIBLE_DEVICES)')
args = parser.parse_args()

# Append project root path to sys.path for module importing
sys.path.append(args.path)

# Set visible CUDA devices
os.environ['CUDA_VISIBLE_DEVICES'] = args.gpu

# Change working directory to the project root
os.chdir(args.path)

# Optional: Print confirmation
print(f"CUDA_VISIBLE_DEVICES set to {args.gpu}")
print(f"Working directory changed to {args.path}")

# main
from utils.json_processor import read_json, write_json
from utils.split_step import split_step

InternVL_MPO_json = "inference/results/MMPR/InternVL-MPO/0.json"
InternVL_MPO_data = read_json(InternVL_MPO_json)
dataset_json = "dataset/MMPR/train.json"
dataset = read_json(dataset_json)

# 去掉没有final answer的
format_rule_candidate = []
for i in InternVL_MPO_data:
    if 'Final answer: ' in i['response']:
        format_rule_candidate.append(i)
print(len(format_rule_candidate))

# 建立树结构
tree = []
for i in format_rule_candidate:
    for j in range(5):
        id = i['id']
        sid = j + 1
        input = i['input']
        add = split_step(sid, i['response'])
        ground_truth = dataset[id]['ground_truth']
        image_path = dataset[id]['image_path']
        dataset_name = dataset[id]['dataset']
        if i['true_false']:
            score = 1
        else:
            score = 0
        tree.append({'id': id,
                     'sid': sid,
                     'input': input,
                     'add': add,
                     'ground_truth': ground_truth,
                     'image_path': image_path,
                     'dataset': dataset_name,
                     'score': score,
                     'times': 1,
                     'accuracy': score})
print(len(tree))

write_json("MC/results/MMPR/Tree/0.json", tree)

