LICENSE.md
README.md
setup.py
lm_eval/__init__.py
lm_eval/base.py
lm_eval/evaluator.py
lm_eval/metrics.py
lm_eval/utils.py
lm_eval.egg-info/PKG-INFO
lm_eval.egg-info/SOURCES.txt
lm_eval.egg-info/dependency_links.txt
lm_eval.egg-info/requires.txt
lm_eval.egg-info/top_level.txt
lm_eval/datasets/__init__.py
lm_eval/datasets/asdiv/__init__.py
lm_eval/datasets/asdiv/asdiv.py
lm_eval/datasets/coqa/__init__.py
lm_eval/datasets/coqa/coqa.py
lm_eval/datasets/drop/__init__.py
lm_eval/datasets/drop/drop.py
lm_eval/datasets/headqa/__init__.py
lm_eval/datasets/headqa/headqa.py
lm_eval/datasets/hendrycks_ethics/__init__.py
lm_eval/datasets/hendrycks_ethics/hendrycks_ethics.py
lm_eval/datasets/hendrycks_math/__init__.py
lm_eval/datasets/hendrycks_math/hendrycks_math.py
lm_eval/datasets/logiqa/__init__.py
lm_eval/datasets/logiqa/logiqa.py
lm_eval/datasets/mutual/__init__.py
lm_eval/datasets/mutual/mutual.py
lm_eval/datasets/pile/__init__.py
lm_eval/datasets/pile/pile.py
lm_eval/datasets/quac/__init__.py
lm_eval/datasets/quac/quac.py
lm_eval/datasets/sat_analogies/__init__.py
lm_eval/datasets/sat_analogies/sat_analogies.py
lm_eval/datasets/triviaqa/__init__.py
lm_eval/datasets/triviaqa/triviaqa.py
lm_eval/datasets/unscramble/__init__.py
lm_eval/datasets/unscramble/unscramble.py
lm_eval/decontamination/__init__.py
lm_eval/decontamination/archiver.py
lm_eval/decontamination/decontaminate.py
lm_eval/decontamination/janitor.py
lm_eval/models/__init__.py
lm_eval/models/dummy.py
lm_eval/models/gpt2.py
lm_eval/models/gpt3.py
lm_eval/models/huggingface.py
lm_eval/models/textsynth.py
lm_eval/tasks/__init__.py
lm_eval/tasks/anli.py
lm_eval/tasks/arc.py
lm_eval/tasks/arithmetic.py
lm_eval/tasks/asdiv.py
lm_eval/tasks/blimp.py
lm_eval/tasks/cbt.py
lm_eval/tasks/coqa.py
lm_eval/tasks/crowspairs.py
lm_eval/tasks/drop.py
lm_eval/tasks/glue.py
lm_eval/tasks/gsm8k.py
lm_eval/tasks/headqa.py
lm_eval/tasks/hellaswag.py
lm_eval/tasks/hendrycks_ethics.py
lm_eval/tasks/hendrycks_math.py
lm_eval/tasks/hendrycks_test.py
lm_eval/tasks/lambada.py
lm_eval/tasks/lambada_cloze.py
lm_eval/tasks/lambada_multilingual.py
lm_eval/tasks/logiqa.py
lm_eval/tasks/mathqa.py
lm_eval/tasks/mc_taco.py
lm_eval/tasks/mutual.py
lm_eval/tasks/naturalqs.py
lm_eval/tasks/openbookqa.py
lm_eval/tasks/pile.py
lm_eval/tasks/piqa.py
lm_eval/tasks/prost.py
lm_eval/tasks/pubmedqa.py
lm_eval/tasks/qa4mre.py
lm_eval/tasks/qasper.py
lm_eval/tasks/quac.py
lm_eval/tasks/race.py
lm_eval/tasks/sat.py
lm_eval/tasks/sciq.py
lm_eval/tasks/squad.py
lm_eval/tasks/storycloze.py
lm_eval/tasks/superglue.py
lm_eval/tasks/swag.py
lm_eval/tasks/toxigen.py
lm_eval/tasks/translation.py
lm_eval/tasks/triviaqa.py
lm_eval/tasks/truthfulqa.py
lm_eval/tasks/unscramble.py
lm_eval/tasks/webqs.py
lm_eval/tasks/wikitext.py
lm_eval/tasks/winogrande.py
lm_eval/tasks/wsc273.py
scripts/__init__.py
scripts/cost_estimate.py
scripts/get_prompts.py
scripts/make_gpt2_test_cases.py
scripts/make_table_tasks.py
scripts/write_out.py
scripts/clean_training_data/__init__.py
scripts/clean_training_data/compress_and_package.py
scripts/clean_training_data/generate_13_grams.py
scripts/clean_training_data/investigate_pile.py
scripts/clean_training_data/process_sorted_buckets.py
scripts/clean_training_data/sort_13_gram_buckets.py