{
  "self_prediction_willingness": {
    "100_word_corpus": {
      "models_self_predicting": 5,
      "total_models": 10,
      "observed_rate": 0.5,
      "expected_rate": 0.5,
      "p_value": 0.623046875,
      "significant_at_05": false,
      "interpretation": "Only 5/10 models ever predicted themselves"
    },
    "500_word_corpus": {
      "models_self_predicting": 4,
      "total_models": 10,
      "observed_rate": 0.4,
      "expected_rate": 0.5,
      "p_value": 0.376953125,
      "significant_at_05": false,
      "interpretation": "Only 4/10 models ever predicted themselves"
    }
  },
  "exact_prediction_accuracy": {
    "100_word_corpus": {
      "correct_predictions": 103,
      "total_predictions": 1000,
      "observed_accuracy": 0.103,
      "random_baseline": 0.1,
      "p_value": 0.7517199988983746,
      "significant_at_05": false,
      "interpretation": "Accuracy 10.3% vs 10.0% baseline"
    },
    "500_word_corpus": {
      "correct_predictions": 109,
      "total_predictions": 1000,
      "observed_accuracy": 0.109,
      "random_baseline": 0.1,
      "p_value": 0.3425857177113689,
      "significant_at_05": false,
      "interpretation": "Accuracy 10.9% vs 10.0% baseline"
    }
  },
  "binary_self_identification": {
    "100_word_corpus": {
      "mean_accuracy": 0.821,
      "threshold": 0.9,
      "sample_size": 100,
      "p_value": 0.010007279262125005,
      "significant_below_threshold": true,
      "interpretation": "Mean accuracy 82.1% significantly below 90.0% threshold"
    },
    "500_word_corpus": {
      "mean_accuracy": 0.723,
      "threshold": 0.9,
      "sample_size": 100,
      "p_value": 3.481426687624817e-07,
      "significant_below_threshold": true,
      "interpretation": "Mean accuracy 72.3% significantly below 90.0% threshold"
    }
  },
  "prediction_bias": {
    "observed_gpt_claude_rate": 0.977,
    "expected_gpt_claude_rate": 0.4,
    "observed_count": 977,
    "expected_count": 400,
    "chi2_statistic": 1387.2041666666667,
    "p_value": 1.267651665486498e-303,
    "significant_bias": true,
    "interpretation": "Extreme bias: 97.7% predictions to GPT/Claude vs 40.0% expected"
  },
  "confidence_intervals": {
    "exact_accuracy_100w": {
      "point_estimate": 0.103,
      "ci_lower": 0.08565481000508716,
      "ci_upper": 0.1233836362324436,
      "interpretation": "10.3% (95% CI: 8.6%-12.3%)"
    },
    "exact_accuracy_500w": {
      "point_estimate": 0.109,
      "ci_lower": 0.09116003338451377,
      "ci_upper": 0.12983249175119035,
      "interpretation": "10.9% (95% CI: 9.1%-13.0%)"
    },
    "binary_accuracy_100w": {
      "point_estimate": 0.821,
      "ci_lower": 0.7333264161369926,
      "ci_upper": 0.8829977450105364,
      "interpretation": "82.1% (95% CI: 73.3%-88.3%)"
    },
    "binary_accuracy_500w": {
      "point_estimate": 0.723,
      "ci_lower": 0.6251197129007884,
      "ci_upper": 0.7986031478881379,
      "interpretation": "72.3% (95% CI: 62.5%-79.9%)"
    }
  }
}