{
    "aime25": {
        "name": "AIME 2025",
        "path": "yentinglin/aime_2025",
        "answer_type": "boxed",
        "id_field": "id",
        "question_field": "problem",
        "answer_field": "answer",
        "prompt_template": "{question}"
    },
    "aime24": {
        "name": "AIME 2024",
        "path": "Maxwell-Jia/AIME_2024",
        "answer_type": "boxed",
        "id_field": "ID",
        "question_field": "Problem",
        "answer_field": "Answer",
        "prompt_template": "{question}"
    },
    "math500": {
        "name": "Math500",
        "path": "HuggingFaceH4/MATH-500",
        "answer_type": "boxed",
        "id_field": "id",
        "question_field": "problem",
        "answer_field": "answer",
        "prompt_template": "{question}",
        "description": "Math500 dataset"
    },
    "amc23":{
        "name": "AMC 2023",
        "path": "math-ai/amc23",
        "answer_type": "boxed",
        "id_field": "id",
        "question_field": "question",
        "answer_field": "answer",
        "prompt_template": "{question}",
        "description": "AMC 2023 dataset"
    },
    "hmmt25": {
        "name": "HMMT February 2025",
        "path": "MathArena/hmmt_feb_2025",
        "answer_type": "boxed",
        "id_field": "problem_idx",
        "question_field": "problem",
        "answer_field": "answer",
        "prompt_template": "{question}",
        "description": "HMMT February 2025 dataset"
    },
    "brumo25": {
        "name": "BRUMO 2025",
        "path": "MathArena/brumo_2025",
        "answer_type": "boxed",
        "id_field": "problem_idx",
        "question_field": "problem",
        "answer_field": "answer",
        "prompt_template": "{question}",
        "description": "BRUMO 2025 dataset"
    },
    "lightr1_76k": {
        "name": "LightR1-76k",
        "path": "data/formatted_data/stage1-76k.json",
        "answer_type": "boxed",
        "id_field": "id",
        "question_field": "problem",
        "answer_field": "answer",
        "prompt_template": "{question}",
        "description": "LightR1-76k dataset"
    },
    "deepmath": {
        "name": "DeepMath",
        "path": "data/formatted_data/DeepMath-103K.json",
        "answer_type": "boxed",
        "id_field": "id",
        "question_field": "question",
        "answer_field": "final_answer",
        "prompt_template": "{question}",
        "description": "DeepMath dataset"
    },
    "lightr1_3k":{
        "name": "LightR1-3k",
        "path": "data/formatted_data/stage2-3k.json",
        "answer_type": "boxed",
        "id_field": "id",
        "question_field": "problem",
        "answer_field": "answer",
        "prompt_template": "{question}",
        "description": "LightR1-3k dataset"
    },
    "gsm8k":{
        "name": "GSM8K",
        "path": "data/formatted_data/gsm8k_test.json",
        "answer_type": "boxed",
        "id_field": "id",
        "question_field": "problem",
        "answer_field": "answer",
        "prompt_template": "{question}",
        "description": "test set of GSM8K dataset"
    },
    "olympiadbench":{
        "name": "OlympiadBench",
        "path": "data/formatted_data/olympiadbench.jsonl",
        "answer_type": "boxed",
        "id_field": "id",
        "question_field": "question",
        "answer_field": "answer",
        "prompt_template": "{question}",
        "description": "test set of OlympiadBench dataset"
    },
    "gpqa":{
        "name": "GPQA",
        "path": "data/formatted_data/gpqa_diamond.jsonl",
        "answer_type": "boxed",
        "id_field": "id",
        "question_field": "question",
        "answer_field": "answer",
        "prompt_template": "{question}",
        "description": "Diamond subset of the GPQA dataset"
    },
    "chmath":{
        "name": "CHMath",
        "path": "data/formatted_data/chmath.jsonl",
        "answer_type": "boxed",
        "id_field": "id",
        "question_field": "problem",
        "answer_field": "answer",
        "prompt_template": "{question}",
        "description": "test set of CHMath dataset"
    },
    "minerva":{
        "name": "Minerva",
        "path": "data/formatted_data/minerva.jsonl",
        "answer_type": "boxed",
        "id_field": "id",
        "question_field": "question",
        "answer_field": "answer",
        "prompt_template": "{question}",
        "description": "test set of Minerva dataset"
    },
    "mmlu_stem":{
        "name": "MMLU-STEM",
        "path": "data/formatted_data/mmlu_stem.jsonl",
        "answer_type": "boxed",
        "id_field": "id",
        "question_field": "question",
        "answer_field": "answer",
        "prompt_template": "{question}",
        "description": "test set of MMLU-STEM dataset"
    },
    "mmlu_redux":{
        "name": "MMLU-Redux",
        "path": "data/formatted_data/mmlu_redux.jsonl",
        "answer_type": "boxed",
        "id_field": "id",
        "question_field": "question",
        "answer_field": "answer",
        "prompt_template": "{question}",
        "description": "test set of MMLU-Redux dataset"
    }
}