{"task_name": "piqa:mc", "task_hash": "3692c0fd172e26cd97e4a75b14cf257e", "task_config": {"task_name": "piqa:mc", "task_core": "piqa", "limit": 1000000, "split": "validation", "num_shots": 5, "fewshot_seed": 1234, "primary_metric": "acc_raw", "random_subsample_seed": 1234, "context_kwargs": {}, "generation_kwargs": {}, "metric_kwargs": {}, "native_id_field": "index", "fewshot_source": "OLMES:piqa", "dataset_path": "piqa", "dataset_name": null, "use_chat_format": null, "version": 0, "revision": null, "metadata": {"regimes": ["OLMES-v0.1"], "alias": "piqa:mc::olmes"}}, "current_date": "2024-11-18 22:10:00 UTC", "num_instances": 1838}