{
    "config": {
        "model": {
            "name": "baseline_tests"
        },
        "task": {
            "name": "test_offset"
        },
        "baseline": {
            "embedder": {
                "name": "none"
            },
            "retriever": {
                "name": "none"
            },
            "explanation": {
                "name": "none",
                "requires_model_queries": false
            },
            "name": "predict_average",
            "class_name": "predict_average"
        },
        "distributional_shift": {
            "name": "new_combinations",
            "train_variables": 5,
            "new_values": 3
        },
        "dataset_construction": {
            "baseline_filter": {
                "tv_distance_threshold": 0.0,
                "log_score_threshold": -0.7
            },
            "templates_per_topic": 1,
            "train_questions_per_template": 200,
            "test_questions_per_template": 30
        }
    },
    "n_templates_evaluated": 1,
    "templates_evaluated": [
        "moral_dilemmas_35"
    ],
    "results": {
        "log_score": -0.769816477872714,
        "normalized_log_score": -0.37221026277029795,
        "kl_divergence": 0.37221026277029795,
        "accuracy": 0.504,
        "tv_distance": 0.2808487877304237
    }
}