{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "cae5de21",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Parameters: n=30, ρ=0.15, samples=100000, seed=42\n",
      "--------------------------------------------------\n",
      "Theoretical Noise Stability: 0.500000\n",
      "Empirical Noise Stability:   0.500210\n"
     ]
    }
   ],
   "source": [
    "import random\n",
    "import numpy as np\n",
    "\n",
    "def estimate_noise_stability_consistent(n, rho, num_samples, seed=None):\n",
    "    if seed is not None:\n",
    "        random.seed(seed)\n",
    "        np.random.seed(seed)\n",
    "    \n",
    "    # We will compute f(x) and f(y) differently depending on if x == y.\n",
    "    # We don't need a truth table because we only care if f(x) == f(y).\n",
    "    \n",
    "    matching_outputs_count = 0\n",
    "    for _ in range(num_samples):\n",
    "        # Generate a random input x and its noisy version y\n",
    "        x = np.random.randint(2, size=n)\n",
    "        y = np.copy(x)\n",
    "        noise_mask = np.random.uniform(0, 1, size=n) > rho\n",
    "        y[noise_mask] = 1 - y[noise_mask]\n",
    "\n",
    "        if np.array_equal(x, y):\n",
    "            # If inputs are identical, outputs MUST be identical\n",
    "            matching_outputs_count += 1\n",
    "        else:\n",
    "            # If inputs are different, outputs are independent coin flips\n",
    "            if random.randint(0, 1) == random.randint(0, 1):\n",
    "                matching_outputs_count += 1\n",
    "                \n",
    "    return matching_outputs_count / num_samples\n",
    "\n",
    "# --- Main script to run the experiment ---\n",
    "if __name__ == \"__main__\":\n",
    "    n_vars = 30\n",
    "    rho_val = 0.15\n",
    "    samples = 100_000\n",
    "    seed_val = 42\n",
    "\n",
    "    theoretical_stability = 0.5 * (rho_val ** n_vars) + 0.5\n",
    "    empirical_stability = estimate_noise_stability_consistent(n_vars, rho_val, samples, seed=seed_val)\n",
    "\n",
    "    print(f\"Parameters: n={n_vars}, ρ={rho_val}, samples={samples}, seed={seed_val}\")\n",
    "    print(\"--------------------------------------------------\")\n",
    "    print(f\"Theoretical Noise Stability: {theoretical_stability:.6f}\")\n",
    "    print(f\"Empirical Noise Stability:   {empirical_stability:.6f}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "9b12f078",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Parameters: n=8, ρ=0.8, samples=500000, seed=42\n",
      "--------------------------------------------------\n",
      "Theoretical Noise Stability: 0.820000\n",
      "Empirical Noise Stability:   0.679632\n"
     ]
    }
   ],
   "source": [
    "import random\n",
    "import numpy as np\n",
    "\n",
    "def noise_stability_parity_k2(n, rho, num_samples, seed=None):\n",
    "    \"\"\"\n",
    "    Estimates the noise stability of a sparse parity function with k=2.\n",
    "\n",
    "    Args:\n",
    "        n (int): The total number of variables (>=2).\n",
    "        rho (float): The noise parameter (correlation).\n",
    "        num_samples (int): The number of samples for the estimation.\n",
    "        seed (int, optional): A seed for reproducibility.\n",
    "    \n",
    "    Returns:\n",
    "        float: The empirically calculated noise stability.\n",
    "    \"\"\"\n",
    "    if seed is not None:\n",
    "        random.seed(seed)\n",
    "        np.random.seed(seed)\n",
    "\n",
    "    # The sparse parity function with k=2, using the first two bits\n",
    "    f_parity = lambda x: (x[0] + x[1]) % 2\n",
    "\n",
    "    matching_outputs_count = 0\n",
    "    for _ in range(num_samples):\n",
    "        # Generate a random input x\n",
    "        x = np.random.randint(2, size=n)\n",
    "        \n",
    "        # Generate a noisy version y of x\n",
    "        y = np.copy(x)\n",
    "        noise_mask = np.random.uniform(0, 1, size=n) > rho\n",
    "        y[noise_mask] = 1 - y[noise_mask]\n",
    "        \n",
    "        # Apply the function to both inputs and check for a match\n",
    "        if f_parity(x) == f_parity(y):\n",
    "            matching_outputs_count += 1\n",
    "            \n",
    "    return matching_outputs_count / num_samples\n",
    "\n",
    "# --- Main script to run the experiment ---\n",
    "if __name__ == \"__main__\":\n",
    "    n_vars = 8\n",
    "    rho_val = 0.8\n",
    "    samples = 500_000\n",
    "    seed_val = 42\n",
    "\n",
    "    # Calculate the theoretical noise stability for k=2 parity\n",
    "    theoretical_stability = (1 + rho_val**2) / 2\n",
    "\n",
    "    # Estimate the noise stability using the function\n",
    "    empirical_stability = noise_stability_parity_k2(n_vars, rho_val, samples, seed=seed_val)\n",
    "\n",
    "    # Print the results\n",
    "    print(f\"Parameters: n={n_vars}, ρ={rho_val}, samples={samples}, seed={seed_val}\")\n",
    "    print(\"--------------------------------------------------\")\n",
    "    print(f\"Theoretical Noise Stability: {theoretical_stability:.6f}\")\n",
    "    print(f\"Empirical Noise Stability:   {empirical_stability:.6f}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "b2921b2e",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "rho=0.50 | Stab emp=0.0667, th=0.2500 | Match emp=0.5333, th=0.6250\n"
     ]
    }
   ],
   "source": [
    "import numpy as np\n",
    "\n",
    "def estimate_k2_xor_stability(n=8, rho=0.8, num_samples=200_000, seed=42):\n",
    "    rng = np.random.default_rng(seed)\n",
    "    # Flip probability per bit that yields correlation rho in ±1 space\n",
    "    eps = (1.0 - rho) / 2.0\n",
    "\n",
    "    # Sample X in {0,1}^n and construct Y by flipping bits with prob eps\n",
    "    X = rng.integers(0, 2, size=(num_samples, n))\n",
    "    flips = rng.random(size=(num_samples, n)) < eps\n",
    "    Y = X ^ flips.astype(np.int64)\n",
    "\n",
    "    # 2-sparse XOR on first two bits (any fixed pair works)\n",
    "    fX_01 = (X[:, 0] ^ X[:, 1])          # in {0,1}\n",
    "    fY_01 = (Y[:, 0] ^ Y[:, 1])          # in {0,1}\n",
    "\n",
    "    # Convert to ±1 for noise stability E[f(X)f(Y)]\n",
    "    gX = 2 * fX_01 - 1\n",
    "    gY = 2 * fY_01 - 1\n",
    "    stab_empirical = np.mean(gX * gY)\n",
    "\n",
    "    # Also compute match probability\n",
    "    match_empirical = np.mean(fX_01 == fY_01)\n",
    "\n",
    "    # Theoretical values\n",
    "    stab_theoretical = rho ** 2\n",
    "    match_theoretical = (1.0 + stab_theoretical) / 2.0\n",
    "\n",
    "    return {\n",
    "        \"stab_empirical\": stab_empirical,\n",
    "        \"stab_theoretical\": stab_theoretical,\n",
    "        \"match_empirical\": match_empirical,\n",
    "        \"match_theoretical\": match_theoretical,\n",
    "    }\n",
    "\n",
    "if __name__ == \"__main__\":\n",
    "    for rho in [0.5]:\n",
    "        res = estimate_k2_xor_stability(n=15, rho=rho, num_samples=30, seed=123)\n",
    "        print(f\"rho={rho:0.2f} | Stab emp={res['stab_empirical']:.4f}, th={res['stab_theoretical']:.4f} | \"\n",
    "              f\"Match emp={res['match_empirical']:.4f}, th={res['match_theoretical']:.4f}\")"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
