def fix_json(model_response: str) -> str:
    """
    Certain models, such as lmms-lab/llava-onevision-qwen2-7b-ov generate too many output tokens. This particular
    LLaVa generates "END OF XXX EXAMPLE" and then proceeds to generate subsequent outputs. This heuristic tries
    to detect such cases and delete the unnecessary trailing tokens.
    Other models, e.g. microsoft/Phi-3.5-vision-instruct, generate unnecessary prefix tokens.
    """

    # Remove leading tokens
    json_start_idx = model_response.find("{")
    if json_start_idx > 0:
        print(
            f"Hallucination intervention: detected unexpected leading tokens before '{{' in model's response at index: {json_start_idx}"
        )
        print(f"Before: {model_response}")
        model_response = model_response[json_start_idx:]
        print(f"After: {model_response}")

    # Remove trailing tokens
    json_end_idx = None
    num_characters = 0
    for line in model_response.split("\n"):
        if line == "}":
            json_end_idx = num_characters + 1
            break
        else:
            num_characters += len(line) + 1
    if json_end_idx is not None:
        print(
            f"Hallucination intervention: detected unexpected trailing tokens after '}}' in model's response at index: {json_end_idx}"
        )
        print(f"Before: {model_response}")
        model_response = model_response[:json_end_idx]
        print(f"After: {model_response}")

    return model_response
