{
    "config": {
        "model": {
            "name": "vicuna-7b-v1.3",
            "batch_size": 32,
            "prompt": "A chat between a curious user and an artificial intelligence assistant. The assistant always gives simple Yes or No answer to the user's questions. USER: [question]\nASSISTANT: Answer:",
            "cot": false,
            "free_response_prompt": "A chat between a curious human and an artificial intelligence assistant. The assistant gives helpful, detailed, and polite answers to the human's questions.\n\nUSER: [question]\nASSISTANT:",
            "dataset_model_name": "vicuna-7b-v1.3"
        },
        "task": {
            "name": "hiring_decisions",
            "possible_shift_variables": [
                "e"
            ]
        },
        "baseline": {
            "explanation": {
                "name": "spamchar",
                "requires_model_queries": false
            },
            "embedder": {
                "name": "GloVe"
            },
            "retriever": {
                "name": "nearest_neighbor"
            },
            "name": "distill_spamchar",
            "class_name": "distillation",
            "model_name": "microsoft/deberta-v3-base",
            "train_epochs": 5,
            "batch_size": 16,
            "n_shot": 3,
            "test_on_train_data": true,
            "seed": 0
        },
        "distributional_shift": {
            "name": "new_combinations",
            "train_variables": 5,
            "new_values": 3
        },
        "dataset_construction": {
            "templates_per_topic": 15,
            "train_questions_per_template": 500,
            "test_questions_per_template": 50
        }
    },
    "n_templates_evaluated": 15,
    "templates_evaluated": [
        "hiring_decisions_184",
        "hiring_decisions_571",
        "hiring_decisions_951",
        "hiring_decisions_131",
        "hiring_decisions_77",
        "hiring_decisions_32",
        "hiring_decisions_256",
        "hiring_decisions_247",
        "hiring_decisions_54",
        "hiring_decisions_700",
        "hiring_decisions_366",
        "hiring_decisions_725",
        "hiring_decisions_962",
        "hiring_decisions_912",
        "hiring_decisions_250"
    ],
    "results": {
        "log_score": -0.7646806955650473,
        "normalized_log_score": -0.2570852955646018,
        "kl_divergence": 0.2570852955646018,
        "accuracy": 0.6613333333333333,
        "tv_distance": 0.2232016526156683
    },
    "results_on_train_data": {
        "log_score": -0.5082108410128938,
        "normalized_log_score": -0.03946462624456666,
        "kl_divergence": 0.03946462624456666,
        "accuracy": 0.9325333333333332,
        "tv_distance": 0.07317590418110614
    }
}