import json

import pytest

from src.postprocessing import fix_json

LEADING_AND_TRAILING_TOKENS_JSON = """
start of json
{
  "a": 2,
  "b": {
    "c": 4
  }
}
end of json
""".strip()


REPEATED_JSON = """
First example:
{
  "a": 2,
  "b": {
    "c": 4
  }
}
Second example:
{
  "a": 3,
  "b": {
    "c": 5
  }
}
third example ...
""".strip()


GPT_4_RESPONSE = """
Bongard problem:
Left images: All images show people skateboarding on rails or ledges.
Right images: All images show people skateboarding on flat surfaces or in motion without specific tricks.

First test image: The test image shows a person skateboarding in a skatepark, specifically performing a trick on a curved surface, which is similar to the skateboarding on rails or ledges as seen in the left images.

Second test image: The test image shows a person holding a skateboard, standing on a flat surface, which aligns with the theme of skateboarding on flat surfaces or in motion without specific tricks as seen in the right images.

Response:
```json
{
    "first": {
        "explanation": "The test image shows a person skateboarding in a skatepark on a curved surface, similar to the skateboarding on rails or ledges featured in all images on the left side.",
        "concept": "skateboarding on rails/ledges vs skateboarding on flat surfaces",
        "answer": "LEFT"
    },
    "second": {
        "explanation": "The test image shows a person holding a skateboard on a flat surface, aligning with the theme of skateboarding on flat surfaces or in motion without specific tricks as seen in the right images.",
        "concept": "skateboarding on rails/ledges vs skateboarding on flat surfaces",
        "answer": "RIGHT"
    }
}
```
"""


@pytest.mark.parametrize(
    "text,expected",
    [
        (LEADING_AND_TRAILING_TOKENS_JSON, {"a": 2, "b": {"c": 4}}),
        (REPEATED_JSON, {"a": 2, "b": {"c": 4}}),
    ],
)
def test_fix_json_returns_expected_dict(text: str, expected: dict):
    actual = fix_json(text)
    actual = json.loads(actual)
    assert expected == actual


@pytest.mark.parametrize("text", [GPT_4_RESPONSE])
def test_fix_json_returns_correctly_formatted_json_for_images_to_sides_binary_classification(
    text: str,
):
    actual = fix_json(text)
    actual = json.loads(actual)
    assert actual["first"]["answer"] in {"LEFT", "RIGHT"}
    assert actual["second"]["answer"] in {"LEFT", "RIGHT"}
