{
  "models": [
    "HuggingFaceTB/SmolLM3-3B-Base",
    "Qwen/Qwen2.5-3B",
    "Qwen/Qwen2.5-7B-Instruct",
    "Qwen/Qwen2.5-Math-7B-Instruct",
    "Qwen/Qwen3-1.7B-Base",
    "Qwen/Qwen3-4B",
    "Qwen/Qwen3-4B-Base",
    "Qwen/Qwen3-4B-Instruct-2507",
    "deepseek-ai/DeepSeek-Math-7B-Instruct",
    "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B",
    "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B",
    "deepseek-ai/deepseek-math-7b-instruct",
    "google/gemma-3-4b-it",
    "google/gemma-3-4b-pt"
  ],
  "datasets": [
    {
      "dataset": "AI-MO/aimo-validation-aime",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "AI-MO/aimo-validation-amc",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "AI-MO/aimo-validation-math-level-5",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "AI-MO/NuminaMath-CoT",
      "splits": [
        "test",
        "train"
      ]
    },
    {
      "dataset": "AI-MO/NuminaMath-TIR",
      "splits": [
        "test",
        "train"
      ]
    },
    {
      "dataset": "AIMERgzr/PapperScore",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "AMead10/Universal-glaive-function-calling-v2",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Asap7772/aime_gpt-4o-mini_responses_evaluated_flatturn",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "AymanTarig/function-calling-v0.2-with-r1-cot",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "BitAgent/tool_calling",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "BitStarWalkin/AIME_1983_2024",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "ChilleD/SVAMP",
      "splits": [
        "test",
        "train"
      ]
    },
    {
      "dataset": "CohereLabs/m-ArenaHard-v2.0",
      "config": "en",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "Deepexi/function-calling-small",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Digital-nimbus/llama-2-oai-function-calling",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "EleutherAI/hendrycks_math",
      "configs": [
        "algebra",
        "counting_and_probability",
        "geometry",
        "intermediate_algebra",
        "number_theory"
      ],
      "splits": [
        "test",
        "train"
      ]
    },
    {
      "dataset": "GBaker/MedQA-USMLE-4-options",
      "splits": [
        "test",
        "train"
      ]
    },
    {
      "dataset": "Goekdeniz-Guelmez/Function_Calling_Unfiltered",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "HuggingFaceH4/aime_2024",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "HuggingFaceH4/Bespoke-Stratos-17k",
      "splits": [
        "test",
        "train"
      ]
    },
    {
      "dataset": "HuggingFaceH4/CodeAlpaca_20K",
      "splits": [
        "test",
        "train"
      ]
    },
    {
      "dataset": "HuggingFaceH4/ultrachat_200k",
      "splits": [
        "test_gen",
        "test_sft",
        "train_gen",
        "train_sft"
      ]
    },
    {
      "dataset": "HuggingFaceH4/ultrafeedback_binarized",
      "splits": [
        "test_gen",
        "test_prefs",
        "test_sft",
        "train_gen",
        "train_prefs",
        "train_sft"
      ]
    },
    {
      "dataset": "HydraLM/glaive_function_calling_v1_standardized",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Idavidrein/gpqa",
      "configs": [
        "gpqa_diamond",
        "gpqa_experts",
        "gpqa_extended",
        "gpqa_main"
      ],
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Locutusque/hercules-v2.0",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "LongQ/leetcode_python",
      "splits": [
        "dev",
        "test",
        "train"
      ]
    },
    {
      "dataset": "MCES10-Software/Python-Code-Solutions",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Magpie-Align/Magpie-Pro-300K-Filtered",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Magpie-Align/Magpie-Qwen2.5-Math-Pro-300K-v0.1",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Magpie-Align/Magpie-Qwen2.5-Pro-300K-Filtered",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Maxwell-Jia/AIME_2024",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Na0s/sft-ready-hendrycks-competition_math",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Nan-Do/code-search-net-python",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Nan-Do/instructional_code-search-net-python",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "NewEden/xlam-function-calling-60k-shareGPT",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "NousResearch/hermes-function-calling-v1",
      "config": "func_calling_singleturn",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Open-Orca/SlimOrca",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Pandores/aime-1983-2025",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Post-training-Data-Flywheel/gorilla-openfunctions-v1",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Prompt48/AIME_Problem_Set_1983-2024",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "RayBernard/leetcode",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "RayBernard/leetcode1000",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Rock23210/AIME_Deepseek_Clean",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Saxo/alpaca_function_calling_dataset",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "TIGER-Lab/MathInstruct",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "TIGER-Lab/MMLU-Pro",
      "splits": [
        "test",
        "validation"
      ]
    },
    {
      "dataset": "TIGER-Lab/TheoremQA",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "TigerResearch/tigerbot-kaggle-leetcodesolutions-en-2k",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Vishal24/function_calling",
      "splits": [
        "test",
        "train"
      ]
    },
    {
      "dataset": "XxCotHGxX/242K_Python_Docstring_Pairs",
      "splits": [
        "test",
        "train",
        "validation"
      ]
    },
    {
      "dataset": "Zaynes/multiple_samples_sympy_numina_aime_with_sol_trace",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "ZeroAgency/gemma3-pythonic-function-tool-calling-v1",
      "splits": [
        "test",
        "train",
        "valid"
      ]
    },
    {
      "dataset": "aadajinkya/python_codes_sample",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "agentlans/train-of-thought",
      "config": "train",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "allenai/ai2_arc",
      "configs": [
        "ARC-Challenge",
        "ARC-Easy"
      ],
      "splits": [
        "test",
        "train",
        "validation"
      ]
    },
    {
      "dataset": "allenai/openbookqa",
      "config": "main",
      "splits": [
        "test",
        "train",
        "validation"
      ]
    },
    {
      "dataset": "allenai/qasc",
      "splits": [
        "test",
        "train",
        "validation"
      ]
    },
    {
      "dataset": "allenai/sciq",
      "splits": [
        "test",
        "train",
        "validation"
      ]
    },
    {
      "dataset": "allenporter/assist-llm-function-calling",
      "splits": [
        "test",
        "train"
      ]
    },
    {
      "dataset": "cais/mmlu",
      "configs": [
        "abstract_algebra",
        "all",
        "anatomy",
        "astronomy",
        "auxiliary_train",
        "clinical_knowledge",
        "college_biology",
        "college_chemistry",
        "college_computer_science",
        "college_mathematics",
        "college_medicine",
        "college_physics",
        "computer_security",
        "conceptual_physics",
        "electrical_engineering",
        "elementary_mathematics",
        "high_school_biology",
        "high_school_chemistry",
        "high_school_computer_science",
        "high_school_mathematics",
        "high_school_physics",
        "high_school_statistics",
        "human_aging",
        "machine_learning",
        "medical_genetics",
        "nutrition",
        "professional_medicine",
        "virology"
      ],
      "splits": [
        "auxiliary_train",
        "dev",
        "test",
        "train",
        "validation"
      ]
    },
    {
      "dataset": "camel-ai/biology",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "camel-ai/chemistry",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "camel-ai/math",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "camel-ai/physics",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "chenggong1995/MATH-lighteval-olympiads_aime",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "codeparrot/codecomplex",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "dakopi/aime_23",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "daman1209arora/jeebench",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "deepmind/aqua_rat",
      "config": "raw",
      "splits": [
        "test",
        "train",
        "validation"
      ]
    },
    {
      "dataset": "deepmind/code_contests",
      "splits": [
        "test",
        "train",
        "valid"
      ]
    },
    {
      "dataset": "derek-thomas/ScienceQA",
      "splits": [
        "test",
        "train",
        "validation"
      ]
    },
    {
      "dataset": "di-zhang-fdu/AIME_1983_2024",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "dim/competition_math",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "dim/competition_math_selected",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "dim/leetcodesolutions_en_2k",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "dinushiTJ/gemma-function-calling",
      "splits": [
        "test",
        "train"
      ]
    },
    {
      "dataset": "dmayhem93/agieval-gaokao-biology",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "dmayhem93/agieval-gaokao-chemistry",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "dmayhem93/agieval-gaokao-mathqa",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "dmayhem93/agieval-gaokao-physics",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "dmayhem93/agieval-logiqa-en",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "dmayhem93/agieval-lsat-ar",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "dmayhem93/agieval-lsat-lr",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "dmayhem93/agieval-sat-en",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "dmayhem93/agieval-sat-math",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "evalplus/mbppplus",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "flytech/python-codes-25k",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "garage-bAInd/Open-Platypus",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "glaiveai/glaive-function-calling",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "glaiveai/glaive-function-calling-v2",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "gneubig/aime-1983-2024",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "google-research-datasets/mbpp",
      "configs": [
        "full",
        "sanitized"
      ],
      "splits": [
        "prompt",
        "test",
        "train",
        "validation"
      ]
    },
    {
      "dataset": "gorilla-llm/Berkeley-Function-Calling-Leaderboard",
      "configs": [
        "chatable",
        "exec_multiple",
        "exec_parallel_multiple",
        "exec_simple",
        "java",
        "javascript",
        "parallel",
        "rest",
        "sql"
      ],
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "greengerong/leetcode",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "hbXNov/numina_amc_aime_deepseek_r1_responses",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "hbXNov/numina_amc_aime_in_depth_deepseek_r1_questions",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "hendrydong/aime24",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "hiyouga/glaive-function-calling-v2-sharegpt",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "huntz47/aimee",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "hypervariance/function-calling-sharegpt",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "iamtarun/python_code_instructions_18k_alpaca",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "interstellarninja/tool-calls-singleturn",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "ise-uiuc/Magicoder-Evol-Instruct-110K",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "ise-uiuc/Magicoder-OSS-Instruct-75K",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "jinaai/code_search_net_clean",
      "splits": [
        "test.go",
        "test.java",
        "test.javascript",
        "test.php",
        "test.python",
        "test.ruby",
        "train.go",
        "train.java",
        "train.javascript",
        "train.php",
        "train.python",
        "train.ruby",
        "validation.go",
        "validation.java",
        "validation.javascript",
        "validation.php",
        "validation.python",
        "validation.ruby"
      ]
    },
    {
      "dataset": "jonathanyin/aime_1983_2023_deepseek-r1-distill-qwen-1.5b_traces_32768",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "jonathanyin/aime_1983_2023_deepseek-r1-distill-qwen-14b_traces_32768",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "jonathanyin/aime_1983_2023_deepseek-r1-distill-qwen-7b_traces_32768",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "jonathanyin/aime_1983_2023_deepseek-r1_traces_16384",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "jonathanyin/aime_1983_2023_deepseek-r1_traces_32768",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "jonathanyin/aime_1983_2023_grok-3-mini-high_traces_32768",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "jonathanyin/aime_1983_2023_qwq-32b_traces_16384",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "jonathanyin/aime_1983_2023_qwq-32b_traces_32768",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "khaimaitien/multi-hop-qa-function-calling-format-V1.0",
      "splits": [
        "train",
        "validation"
      ]
    },
    {
      "dataset": "lighteval/mmlu",
      "configs": [
        "abstract_algebra",
        "all"
      ],
      "splits": [
        "auxiliary_train",
        "dev",
        "test",
        "validation"
      ]
    },
    {
      "dataset": "lockon/glaive_toolcall_en",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "m-a-p/CodeFeedback-Filtered-Instruction",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "martim00/math_aime_2023",
      "splits": [
        "test",
        "train"
      ]
    },
    {
      "dataset": "math-ai/aime24",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "math-ai/aime25",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "meta-math/MetaMathQA",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "microsoft/orca-math-word-problems-200k",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "milsunone/cural-functionary-small-5000",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "mjalg/function-code",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "mlfoundations-dev/4o_annotated_aime",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "mlfoundations-dev/a1_math_numina_aime",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "mlfoundations-dev/a1_math_openmathinstruct_aime",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "mlfoundations-dev/bespokelabs-sky-t1-numina-amc-aime-subset-unfiltered",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "mlfoundations-dev/multiple_samples_all_numina_aime",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "mlfoundations-dev/multiple_samples_ground_truth_numina_aime",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "mlfoundations-dev/multiple_samples_majority_consensus_numina_aime",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "mlfoundations-dev/multiple_samples_majority_consensus_numina_aime_math_verify",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "mlfoundations-dev/r1_annotated_aime",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "narrative-io/narrative-function-calling-v1",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "nickrosh/Evol-Instruct-Code-80k-v1",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "notbadai/python_functions_reasoning",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "nvidia/OpenCodeInstruct",
      "config": "train",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "nvidia/OpenMathInstruct-1",
      "splits": [
        "train",
        "validation"
      ]
    },
    {
      "dataset": "open-r1/codeforces",
      "splits": [
        "test",
        "train"
      ]
    },
    {
      "dataset": "open-r1/OpenR1-Math-220k",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "openai/gsm8k",
      "configs": [
        "default",
        "main"
      ],
      "splits": [
        "test",
        "train"
      ]
    },
    {
      "dataset": "openai/openai_humaneval",
      "config": "openai_humaneval",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "philschmid/AIME_1983_2024",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "prem-research/Funcdex-MT-Function-Calling",
      "splits": [
        "test",
        "train"
      ]
    },
    {
      "dataset": "qfq/genminiall_onlyqwenwrong_aimegpqatrain_domain_powerlaw_steps",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "qwedsacf/competition_math",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "redwoodresearch/mbpp_extended",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "roborovski/synthetic-tool-calls",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "roborovski/synthetic-tool-calls-v2",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "rulins/DeepSeek-R1-Distill-Qwen-32B_NUMINA_train_amc_aime",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "sahil2801/CodeAlpaca-20k",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "semeru/text-code-galeras-code-generation-from-docstring-3k-deduped",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "sharkchill-xy/HumanEval_mbpp_format",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "simplescaling/aime_nofigures",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "smolagents/toolcalling",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "starfishdata/AIME_MATH_1000_LONG_COT",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "starfishdata/AIME_MATH_100_LONG_COT",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "tau/commonsense_qa",
      "splits": [
        "test",
        "train",
        "validation"
      ]
    },
    {
      "dataset": "teknium/OpenHermes-2.5",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "theblackcat102/evol-codealpaca-v1",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "think-a-tron/aime-math-train",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "togethercomputer/glaive-function-calling-v2-formatted",
      "splits": [
        "test",
        "train"
      ]
    },
    {
      "dataset": "TokenBender/code_instructions_122k_alpaca_style",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "vikp/python_code_instructions_filtered",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "weijiezz/math-datasets-100k",
      "splits": [
        "test_aime24",
        "test_aime25",
        "test_amc23",
        "test_gsm8k",
        "test_math500",
        "test_minervamath",
        "test_olympiadbench",
        "train"
      ]
    },
    {
      "dataset": "weijiezz/math-datasets-20k",
      "splits": [
        "test_aime24",
        "test_aime25",
        "test_amc23",
        "test_gsm8k",
        "test_math500",
        "test_minervamath",
        "test_olympiadbench",
        "train"
      ]
    },
    {
      "dataset": "weijiezz/NuminaMath-20k",
      "splits": [
        "test_aime24",
        "test_aime25",
        "test_amc23",
        "test_gsm8k",
        "test_math500",
        "test_minervamath",
        "test_numina",
        "test_olympiadbench",
        "train"
      ]
    },
    {
      "dataset": "xw27/scibench",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "yahma/alpaca-cleaned",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "zhiyuanhucs/AIME_1983_2024",
      "splits": [
        "aime"
      ]
    },
    {
      "dataset": "zhuzilin/aime-2024",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "zuom/AIME-solutions",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "ByteDance-Seed/Code-Contests-Plus",
      "config": null
    },
    {
      "dataset": "WNJXYK/AIME_1983_2024-Reasoning-Paths",
      "config": null
    },
    {
      "dataset": "internlm/Agent-FLAN",
      "config": null
    },
    {
      "dataset": "nvidia/OpenMathInstruct-2",
      "config": null
    },
    {
      "dataset": "AmazonScience/FalseReject"
    },
    {
      "dataset": "Anthropic/hh-rlhf"
    },
    {
      "dataset": "AtlasUnified/atlas-math-sets"
    },
    {
      "dataset": "BAAI/Infinity-Preference"
    },
    {
      "dataset": "CarperAI/openai_summarize_comparisons"
    },
    {
      "dataset": "CarperAI/openai_summarize_tldr"
    },
    {
      "dataset": "ChilleD/MultiArith"
    },
    {
      "dataset": "ChilleD/StrategyQA"
    },
    {
      "dataset": "CohereForAI/aya_dataset"
    },
    {
      "dataset": "CohereLabs/Global-MMLU",
      "configs": [
        "am",
        "ar",
        "bn",
        "cs",
        "de",
        "el",
        "en",
        "es",
        "fa",
        "fil",
        "fr",
        "ha",
        "he",
        "hi",
        "id",
        "ig",
        "it",
        "ja",
        "ko",
        "ky",
        "lt",
        "mg",
        "ms",
        "ne",
        "nl",
        "ny",
        "pl",
        "pt",
        "ro",
        "ru",
        "si",
        "sn",
        "so",
        "sr",
        "sv",
        "sw",
        "te",
        "tr",
        "uk",
        "vi",
        "yo",
        "zh"
      ]
    },
    {
      "dataset": "GAIR/LIMA"
    },
    {
      "dataset": "HuggingFaceH4/no_robots"
    },
    {
      "dataset": "HuggingFaceTB/MagPie-Pro-300k-MT"
    },
    {
      "dataset": "InclusionAI/Ling-Coder-SFT"
    },
    {
      "dataset": "Intel/orca_dpo_pairs"
    },
    {
      "dataset": "LDJnr/Capybara"
    },
    {
      "dataset": "LDJnr/Puffin"
    },
    {
      "dataset": "Muennighoff/natural-instructions"
    },
    {
      "dataset": "Nexusflow/NexusRaven_API_evaluation"
    },
    {
      "dataset": "Norquinal/claude_multiround_chat_30k"
    },
    {
      "dataset": "NousResearch/CharacterCodex"
    },
    {
      "dataset": "Open-Orca/OpenOrca"
    },
    {
      "dataset": "OpenAI/summarize_from_feedback"
    },
    {
      "dataset": "OpenAssistant/oasst1"
    },
    {
      "dataset": "OpenAssistant/oasst2"
    },
    {
      "dataset": "OpenAssistant/oasst_top1_2023-08-25"
    },
    {
      "dataset": "PKU-Alignment/BeaverTails"
    },
    {
      "dataset": "PKU-Alignment/PKU-SafeRLHF"
    },
    {
      "dataset": "PygmalionAI/PIPPA"
    },
    {
      "dataset": "Skywork/Skywork-Reward-Preference-80K-v0.2"
    },
    {
      "dataset": "THUDM/AgentInstruct"
    },
    {
      "dataset": "WizardLM/WizardLM_evol_instruct_70k"
    },
    {
      "dataset": "WizardLM/WizardLM_evol_instruct_V2_143k"
    },
    {
      "dataset": "WizardLM/WizardLM_evol_instruct_V2_196k"
    },
    {
      "dataset": "allenai/WildChat"
    },
    {
      "dataset": "allenai/WildChat-1M"
    },
    {
      "dataset": "allenai/qasper"
    },
    {
      "dataset": "allenai/real-toxicity-prompts"
    },
    {
      "dataset": "allenai/soda"
    },
    {
      "dataset": "allenai/tulu-2.5-preference-data"
    },
    {
      "dataset": "allenai/tulu-3-pref-personas-instruction-following"
    },
    {
      "dataset": "allenai/tulu-3-sft-mixture"
    },
    {
      "dataset": "allenai/tulu-v2-sft-mixture"
    },
    {
      "dataset": "anon8231489123/ShareGPT_Vicuna_unfiltered"
    },
    {
      "dataset": "argilla/distilabel-intel-orca-dpo-pairs"
    },
    {
      "dataset": "argilla/ultrafeedback-binarized-preferences-cleaned"
    },
    {
      "dataset": "argilla/ultrafeedback-multi-binarized-preferences-cleaned"
    },
    {
      "dataset": "b-mc2/sql-create-context"
    },
    {
      "dataset": "bavard/personachat_truecased"
    },
    {
      "dataset": "berkeley-nest/Nectar"
    },
    {
      "dataset": "bigcode/commitpackft"
    },
    {
      "dataset": "bigcode/self-oss-instruct-sc2-exec-filter-50k"
    },
    {
      "dataset": "camel-ai/ai_society"
    },
    {
      "dataset": "ccdv/arxiv-summarization"
    },
    {
      "dataset": "ccdv/govreport-summarization"
    },
    {
      "dataset": "codeparrot/apps"
    },
    {
      "dataset": "cognitivecomputations/dolphin-coder"
    },
    {
      "dataset": "cognitivecomputations/samantha-data"
    },
    {
      "dataset": "databricks/databricks-dolly-15k"
    },
    {
      "dataset": "emozilla/quality"
    },
    {
      "dataset": "euclaise/writingprompts"
    },
    {
      "dataset": "fka/awesome-chatgpt-prompts"
    },
    {
      "dataset": "glaiveai/glaive-code-assistant"
    },
    {
      "dataset": "google/IFEval"
    },
    {
      "dataset": "gretelai/synthetic_text_to_sql"
    },
    {
      "dataset": "hendrycks/competition_math"
    },
    {
      "dataset": "hkust-nlp/deita-10k-v0"
    },
    {
      "dataset": "hkust-nlp/deita-6k-v0"
    },
    {
      "dataset": "jondurbin/airoboros-2.2"
    },
    {
      "dataset": "jondurbin/airoboros-gpt4-1.4.1"
    },
    {
      "dataset": "jondurbin/gutenberg-dpo-v0.1"
    },
    {
      "dataset": "kaist-ai/CoT-Collection"
    },
    {
      "dataset": "kmfoda/booksum"
    },
    {
      "dataset": "knkarthick/dialogsum"
    },
    {
      "dataset": "lmsys/chatbot_arena_conversations"
    },
    {
      "dataset": "lmsys/lmsys-chat-1m"
    },
    {
      "dataset": "lmsys/mt_bench_human_judgments"
    },
    {
      "dataset": "mlabonne/FineTome-100k"
    },
    {
      "dataset": "mlabonne/orpo-dpo-mix-40k"
    },
    {
      "dataset": "nampdn-ai/tiny-codes"
    },
    {
      "dataset": "neulab/conala"
    },
    {
      "dataset": "newfacade/LeetCodeDataset"
    },
    {
      "dataset": "nomic-ai/gpt4all-j-prompt-generations"
    },
    {
      "dataset": "nvidia/HelpSteer"
    },
    {
      "dataset": "nvidia/HelpSteer2"
    },
    {
      "dataset": "nvidia/HelpSteer3"
    },
    {
      "dataset": "open-r1/Mixture-of-Thoughts"
    },
    {
      "dataset": "openai/webgpt_comparisons"
    },
    {
      "dataset": "openbmb/UltraFeedback"
    },
    {
      "dataset": "openbmb/UltraInteract_sft"
    },
    {
      "dataset": "openchat/openchat_sharegpt4_dataset"
    },
    {
      "dataset": "rajpurkar/squad_v2"
    },
    {
      "dataset": "skg/toxigen-data"
    },
    {
      "dataset": "stanfordnlp/SHP"
    },
    {
      "dataset": "stanfordnlp/SHP-2"
    },
    {
      "dataset": "stingning/ultrachat"
    },
    {
      "dataset": "tatsu-lab/alpaca"
    },
    {
      "dataset": "tatsu-lab/alpaca_farm"
    },
    {
      "dataset": "teknium/GPT4-LLM-Cleaned"
    },
    {
      "dataset": "teknium/openhermes"
    },
    {
      "dataset": "tiedong/goat"
    },
    {
      "dataset": "timdettmers/openassistant-guanaco"
    },
    {
      "dataset": "truthfulqa/truthful_qa"
    },
    {
      "dataset": "vicgalle/alpaca-gpt4"
    },
    {
      "dataset": "wics/strategy-qa"
    },
    {
      "dataset": "xlangai/DS-1000"
    },
    {
      "dataset": "yizhongw/self_instruct"
    },
    {
      "dataset": "lvwerra/codeparrot-valid-clean-minimal"
    },
    {
      "dataset": "cognitivecomputations/dolphin"
    },
    {
      "dataset": "openlifescienceai/medmcqa",
      "splits": [
        "train",
        "validation",
        "test"
      ]
    },
    {
      "dataset": "qiaojin/PubMedQA",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "bigbio/pubmed_qa",
      "config": "pubmed_qa_labeled_fold0_source",
      "splits": [
        "train",
        "validation",
        "test"
      ]
    },
    {
      "dataset": "medalpaca/medical_meadow_medqa",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "medalpaca/medical_meadow_wikidoc",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "medalpaca/medical_meadow_wikidoc_patient_information",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "medalpaca/medical_meadow_medical_flashcards",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "lavita/ChatDoctor-HealthCareMagic-100k",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "keivalya/MedQuad-MedicalQnADataset",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "Mohammed-Altaf/medical-instruction-100k",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "ruslanmv/ai-medical-chatbot",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "gamino/wiki_medical_terms",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "nlpie/Llama2-MedTuned-Instructions",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "axiong/pmc_llama_instructions",
      "splits": [
        "train"
      ]
    },
    {
      "dataset": "AdaptLLM/medicine-tasks",
      "splits": [
        "test"
      ]
    },
    {
      "dataset": "bigbio/med_qa"
    },
    {
      "dataset": "lavita/medical-qa-datasets"
    },
    {
      "dataset": "ncbi/Open-Patients"
    },
    {
      "dataset": "HPAI-BSC/medical-specialities"
    },
    {
      "dataset": "HPAI-BSC/MedQA-Mixtral-CoT"
    },
    {
      "dataset": "HPAI-BSC/Medprompt-MedQA-CoT"
    },
    {
      "dataset": "UCSD26/medical_dialog"
    },
    {
      "dataset": "bigbio/meddialog"
    },
    {
      "dataset": "AGBonnet/augmented-clinical-notes"
    },
    {
      "dataset": "omi-health/medical-dialogue-to-soap-summary"
    },
    {
      "dataset": "knowrohit07/know_medical_dialogue_v2"
    },
    {
      "dataset": "har1/MTS_Dialogue-Clinical_Note"
    },
    {
      "dataset": "mahfoos/Patient-Doctor-Conversation"
    },
    {
      "dataset": "casey-martin/MedInstruct"
    },
    {
      "dataset": "Detsutut/MedInstruct"
    },
    {
      "dataset": "dmis-lab/meerkat-instructions"
    },
    {
      "dataset": "shibing624/medical"
    },
    {
      "dataset": "FreedomIntelligence/medical-o1-reasoning-SFT"
    },
    {
      "dataset": "starmpcc/Asclepius-Synthetic-Clinical-Notes"
    },
    {
      "dataset": "thbndi/Mimic4Dataset"
    },
    {
      "dataset": "Amod/mental_health_counseling_conversations"
    },
    {
      "dataset": "ShenLab/MentalChat16K"
    },
    {
      "dataset": "heliosbrahma/mental_health_conversational_dataset"
    },
    {
      "dataset": "vibhorag101/phr_mental_therapy_dataset"
    },
    {
      "dataset": "entfane/psychotherapy"
    },
    {
      "dataset": "fadodr/mental_health_therapy"
    },
    {
      "dataset": "Psychotherapy-LLM/CBT-Bench"
    },
    {
      "dataset": "d4data/biomedical-ner-all"
    },
    {
      "dataset": "bigbio/n2c2_2018_track2"
    },
    {
      "dataset": "HiTZ/Multilingual-Medical-Corpus"
    },
    {
      "dataset": "claws-lab/XLingHealth"
    },
    {
      "dataset": "Trelis/hh-rlhf-dpo"
    },
    {
      "dataset": "RLHFlow/HH-RLHF-Helpful-standard"
    },
    {
      "dataset": "openlifescienceai/mmlu_clinical_knowledge"
    },
    {
      "dataset": "openlifescienceai/mmlu_college_medicine"
    },
    {
      "dataset": "openlifescienceai/mmlu_medical_genetics"
    },
    {
      "dataset": "openlifescienceai/mmlu_professional_medicine"
    },
    {
      "dataset": "bigbio/bionli"
    },
    {
      "dataset": "head_qa"
    },
    {
      "dataset": "casperhansen/liveqa"
    },
    {
      "dataset": "lavita/AlpaCare-MedInstruct-52k"
    },
    {
      "dataset": "FreedomIntelligence/HealthcareMagic"
    },
    {
      "dataset": "FreedomIntelligence/iCliniq"
    },
    {
      "dataset": "Liyuan/MedDialog"
    },
    {
      "dataset": "openmed-community/MedReason-Stenographic"
    },
    {
      "dataset": "medalpaca/medical_meadow_pubmed_causal"
    },
    {
      "dataset": "FreedomIntelligence/CoD-PatientSymDisease"
    },
    {
      "dataset": "blue-blues/medical_cot"
    },
    {
      "dataset": "bigbio/rad_qa"
    },
    {
      "dataset": "mlabonne/MedText"
    },
    {
      "dataset": "lewtun/drug-reviews"
    },
    {
      "dataset": "FreedomIntelligence/DxBench"
    },
    {
      "dataset": "stellalisy/MediQ_AskDocs_preference"
    },
    {
      "dataset": "empirischtech/med-qa-orpo-dpo"
    },
    {
      "dataset": "FreedomIntelligence/ApolloMoEDataset"
    },
    {
      "dataset": "allenai/cord19"
    },
    {
      "dataset": "mteb/raw_medrxiv"
    },
    {
      "dataset": "medalpaca/medical_meadow_cord19"
    },
    {
      "dataset": "openlifescienceai/medqa"
    },
    {
      "dataset": "lavita/MedQuAD"
    },
    {
      "dataset": "kroshan/BioASQ"
    },
    {
      "dataset": "bigbio/bioasq_task_b"
    },
    {
      "dataset": "rag-datasets/rag-mini-bioasq"
    },
    {
      "dataset": "croyer/MIMIC-III-split"
    },
    {
      "dataset": "wshi83/EHRAgent-eicu"
    },
    {
      "dataset": "Eladio/emrqa-msquad"
    },
    {
      "dataset": "louisbrulenaudet/clinical-trials"
    },
    {
      "dataset": "pankajrajdeo/Clinical_Trials"
    },
    {
      "dataset": "ravistech/clinical-trial-llm-v2"
    },
    {
      "dataset": "bigbio/n2c2_2010"
    },
    {
      "dataset": "bigbio/n2c2_2014_deid"
    },
    {
      "dataset": "bigbio/n2c2_2018_track1"
    },
    {
      "dataset": "bigbio/n2c2_2011"
    },
    {
      "dataset": "araag2/MedNLI"
    },
    {
      "dataset": "bigbio/mediqa_nli"
    },
    {
      "dataset": "curaihealth/medical_questions_pairs"
    },
    {
      "dataset": "agenticx/DrugBank"
    },
    {
      "dataset": "SkyHuReal/DrugBank-Alpaca"
    },
    {
      "dataset": "antoinebcx/smiles-molecules-chembl"
    },
    {
      "dataset": "eve-bio/drug-target-activity"
    },
    {
      "dataset": "StanfordAIMI/stanford-deidentifier-only-i2b2"
    }
  ]
}