{
    "math_word_problem_generation": {
        "gpt-4-0613": {
            "error_percentage": 55.00000000000001
        },
        "meta-llama/Llama-2-70b-chat-hf": {
            "error_percentage": 75.0
        }
    },
    "finegrained_fact_verification": {
        "gpt-4-0613": {
            "error_percentage": 55.714285714285715
        },
        "meta-llama/Llama-2-70b-chat-hf": {
            "error_percentage": 78.75
        }
    },
    "answerability_classification": {
        "gpt-4-0613": {
            "error_percentage": 57.85714285714286
        },
        "meta-llama/Llama-2-70b-chat-hf": {
            "error_percentage": 77.5
        }
    }
}