{
    "config": {
        "model": {
            "name": "flan-alpaca-gpt4-xl",
            "batch_size": 32,
            "prompt": "Answer the following yes/no question. [question]",
            "free_response_prompt": "[question]",
            "cot": false,
            "dataset_model_name": "flan-alpaca-gpt4-xl"
        },
        "task": {
            "name": "moral_dilemmas",
            "possible_shift_variables": [
                "a",
                "b",
                "c",
                "d",
                "e"
            ]
        },
        "baseline": {
            "explanation": {
                "name": "counterfactual",
                "requires_model_queries": false
            },
            "embedder": {
                "name": "GloVe"
            },
            "retriever": {
                "name": "nearest_neighbor"
            },
            "name": "distill_counterfactual",
            "class_name": "distillation",
            "model_name": "microsoft/deberta-v3-base",
            "train_epochs": 5,
            "batch_size": 16,
            "n_shot": 3,
            "seed": 0
        },
        "distributional_shift": {
            "name": "new_combinations",
            "train_variables": 5,
            "new_values": 3
        },
        "dataset_construction": {
            "templates_per_topic": 15,
            "train_questions_per_template": 500,
            "test_questions_per_template": 50
        }
    },
    "n_templates_evaluated": 15,
    "templates_evaluated": [
        "moral_dilemmas_371",
        "moral_dilemmas_395",
        "moral_dilemmas_421",
        "moral_dilemmas_112",
        "moral_dilemmas_410",
        "moral_dilemmas_35",
        "moral_dilemmas_197",
        "moral_dilemmas_270",
        "moral_dilemmas_158",
        "moral_dilemmas_109",
        "moral_dilemmas_331",
        "moral_dilemmas_390",
        "moral_dilemmas_289",
        "moral_dilemmas_199",
        "moral_dilemmas_530"
    ],
    "results": {
        "log_score": -0.6856828818400279,
        "normalized_log_score": -0.1475855102373353,
        "kl_divergence": 0.1475855102373353,
        "accuracy": 0.6626666666666666,
        "tv_distance": 0.19847241065051782
    }
}