import os

from tqdm import tqdm

from src.dataset.model import BongardDatasetInfo
from src.model.similarity_classifier import encode_texts, classify_to_sides
from src.strategy.d2s.model import (
    Answer,
    BongardDatasetDescriptions,
    DescriptionToSideResponse,
    DescriptionsToSidesExperiment,
    DescriptionsToSidesExperimentInstance,
    DescriptionsToSidesResponse,
    ExpectedAnswer,
)

DATASETS = [
    "rwr-plus",
    # "rwr-plus-2i",
    # "rwr-plus-3i",
    # "rwr-plus-4i",
    # "rwr-plus-5i",
    # "rwr-plus-6i",
]
# data_dir = "/app/data"
data_dir = "local-data"
method = "d2s_v2"
descriptor = "OpenGVLab/InternVL2_5-78B"
dataset_dir = "/home/Datasets"

for dataset_name in DATASETS:
    dataset = BongardDatasetInfo.from_directory(f"{dataset_dir}/{dataset_name}")
    descriptions: BongardDatasetDescriptions = BongardDatasetDescriptions.from_file(
        f"{data_dir}/{dataset_name}_i1d_v1/{descriptor}_descriptions.json"
    )
    descriptions_dict = descriptions.to_dict()
    instances = []

    for problem in tqdm(dataset.problems):
        problem_descriptions = descriptions_dict.get_descriptions_for_problem(problem)
        expected_answer = ExpectedAnswer(first=Answer.LEFT, second=Answer.RIGHT)
        request = problem_descriptions.create_request(problem, expected_answer)

        left = encode_texts(request.left_descriptions + [request.first])
        right = encode_texts(request.right_descriptions + [request.second])

        first, second = classify_to_sides(left, right, "euclidean", "max")
        instances.append(
            DescriptionsToSidesExperimentInstance(
                problem_id=problem.id,
                descriptions=problem_descriptions,
                response=DescriptionsToSidesResponse(
                    concept="",
                    first=DescriptionToSideResponse(
                        explanation="",
                        answer=first,
                    ),
                    second=DescriptionToSideResponse(
                        explanation="",
                        answer=second,
                    ),
                ),
                expected_answer=expected_answer,
            )
        )

    experiment = DescriptionsToSidesExperiment(
        descriptor_name=descriptor,
        solver_name="similarity-classifier",
        instances=instances,
    )
    os.makedirs(f"{data_dir}/{dataset_name}_{method}/{descriptor}", exist_ok=True)
    experiment.to_file(
        f"{data_dir}/{dataset_name}_{method}/{descriptor}/similarity-classifier_experiment.json"
    )
