import os
import json
from PIL import Image
import io
from torch.utils.data import Dataset
import logging
import pandas as pd

from Benchmarks.POPE.Eval import evaluate
from Benchmarks.POPE.PostProcess import postprocess_answer_pope

class POPE_Dataset(Dataset):
    def __init__(self, data_dir, num_samples=None):
        self.data_dir = data_dir
        self.data_list = []
        for file in os.listdir(self.data_dir):
            if file.endswith(".parquet"):
                df = pd.read_parquet(os.path.join(self.data_dir, file))
                self.data_list.extend(df.to_dict(orient="records"))
        if num_samples:
            self.data_list = self.data_list[:num_samples]

    def __len__(self):
        return len(self.data_list)

    def __getitem__(self, idx):
        item = self.data_list[idx]
        return {
            "image": Image.open(io.BytesIO(item["image"]['bytes'])).convert("RGB"),  # Ensure consistent image format
            "question": item["question"],
            "question_id": item["id"],
            "image_id": item["id"],
            "answers": item["answer"]
        }

def load_pope_dataset(data_dir, num_samples=None):
    try:
        print("🚀 Loading POPE dataset")
        dataset = POPE_Dataset(data_dir, num_samples)
        print(f"✅ Loading {len(dataset)} samples complete")
        return dataset
    except Exception as e:
        logging.error(f"⛔ Error loading POPE dataset: {e}")
        return None

def evaluate_pope_results(data_dir, result_dir, filename_suffix, num_samples, model_name, data_subtype=None, n_show_error=2):
    res_file = f'{result_dir}/Inference/{model_name}_POPE{filename_suffix}'

    results = json.load(open(res_file))
    pred_list = []
    label_list = []
    for result in results:
        label_list.append(result['ground_truth'])
        pred_list.append(postprocess_answer_pope(result['answer']))

    eval_result_str = evaluate(pred_list, label_list)
    json.dump(eval_result_str, open(f"{result_dir}/Eval/{model_name}_POPE_results.json", "w"), indent=4)

    return eval_result_str