{"description": "Measuring Massive Multitask Language Understanding by Dan Hendrycks, Collin Burns, Steven Basart, Andy Zou, Mantas Mazeika, Dawn Song, and Jacob Steinhardt (ICLR 2021).\n", "citation": "@article{hendryckstest2021,\n  title={Measuring Massive Multitask Language Understanding},\n  author={Dan Hendrycks and Collin Burns and Steven Basart and Andy Zou and Mantas Mazeika and Dawn Song and Jacob Steinhardt},\n  journal={Proceedings of the International Conference on Learning Representations (ICLR)},\n  year={2021}\n}\n", "homepage": "https://github.com/hendrycks/test", "license": "MIT", "features": {"question": {"dtype": "string", "_type": "Value"}, "A": {"dtype": "string", "_type": "Value"}, "B": {"dtype": "string", "_type": "Value"}, "C": {"dtype": "string", "_type": "Value"}, "D": {"dtype": "string", "_type": "Value"}, "answer": {"dtype": "string", "_type": "Value"}}, "builder_name": "mmlu", "dataset_name": "mmlu", "config_name": "medical_genetics", "version": {"version_str": "1.0.0", "major": 1, "minor": 0, "patch": 0}, "splits": {"test": {"name": "test", "num_bytes": 20021, "num_examples": 99, "dataset_name": "mmlu"}, "validation": {"name": "validation", "num_bytes": 2590, "num_examples": 10, "dataset_name": "mmlu"}, "train": {"name": "train", "num_bytes": 854, "num_examples": 4, "dataset_name": "mmlu"}}, "download_checksums": {"mmlu.zip": {"num_bytes": 2336375, "checksum": null}}, "download_size": 2336375, "dataset_size": 23465, "size_in_bytes": 2359840}