{
    "config": {
        "model": {
            "name": "embed-1d"
        },
        "task": {
            "name": "plumpuddingcdf",
            "possible_shift_variables": [
                "a",
                "b",
                "c",
                "d",
                "e"
            ]
        },
        "baseline": {
            "model": {
                "name": "gpt-4",
                "batch_size": 1,
                "prompt": "Answer the following question. [question] You must give a simple yes or no answer.",
                "free_response_prompt": "[question]",
                "cot": false
            },
            "explanation": {
                "name": "instructedrevealscores",
                "requires_model_queries": false
            },
            "embedder": {
                "name": "GloVe"
            },
            "retriever": {
                "name": "nearest_neighbor"
            },
            "name": "llm_instructedrevealscores",
            "class_name": "llm_prompting",
            "n_shot": 10,
            "test_questions": 10,
            "seed": 0
        },
        "distributional_shift": {
            "name": "new_combinations",
            "train_variables": 5,
            "new_values": 3
        },
        "dataset_construction": {
            "templates_per_topic": 15,
            "train_questions_per_template": 500,
            "test_questions_per_template": 50
        }
    },
    "n_templates_evaluated": 15,
    "templates_evaluated": [
        "plumpuddingcdf_10",
        "plumpuddingcdf_7",
        "plumpuddingcdf_13",
        "plumpuddingcdf_3",
        "plumpuddingcdf_9",
        "plumpuddingcdf_4",
        "plumpuddingcdf_14",
        "plumpuddingcdf_6",
        "plumpuddingcdf_1",
        "plumpuddingcdf_11",
        "plumpuddingcdf_15",
        "plumpuddingcdf_5",
        "plumpuddingcdf_8",
        "plumpuddingcdf_2",
        "plumpuddingcdf_12"
    ],
    "results": {
        "log_score": -0.490093656270072,
        "normalized_log_score": -0.15449239894156477,
        "kl_divergence": 0.15449239894156477,
        "accuracy": 0.8066666666666666,
        "tv_distance": 0.15666405786494977
    }
}