{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a10f63f6-8b77-4167-88cf-d19c8cd656bf",
   "metadata": {},
   "outputs": [],
   "source": [
    "from joblib import Parallel, delayed  # for parallelization\n",
    "from tqdm import tqdm  # for progress bars\n",
    "from utils import *"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "c7c7735a-a51b-4251-ae3d-d1ea118453fa",
   "metadata": {},
   "source": [
    "# Code reproducibility instructions\n",
    "Do the following steps in order\n",
    "\n",
    "- (1) In the following chunk named \"SELLERS SIZE\", select the number of sellers N = 2. \n",
    "- (2) Run the next chunk named \"RUN SIMULATION FOR N\". \n",
    "- (3) Repet (1) and (2) with N = 4\n",
    "- (4) Repet (1) and (2) with N = 6\n",
    "- (5) Run the chunk \"Merge the 3 plots together for a ALL N\" to "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9a90da50-5b87-46ed-b91e-2c46bc1e0650",
   "metadata": {},
   "outputs": [],
   "source": [
    "## SELLERS SIZE ##\n",
    "N = 2  # number of players/components N = 2, 4, or 6"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8c013bbf-777d-4c9a-9557-ac34a57c9659",
   "metadata": {},
   "outputs": [],
   "source": [
    "## RUN SIMULATION FOR N ##\n",
    "\n",
    "# Define experiment parameters\n",
    "T_values = [100, 400, 800, 1600, 3200]\n",
    "num_runs = 30  # number of repetitions per T\n",
    "rng_master = np.random.default_rng(123)  # master RNG for reproducibility\n",
    "\n",
    "run_parallel = True\n",
    "\n",
    "\n",
    "# Boundaries for p (for each coordinate)\n",
    "p_m_arr = [0] * N\n",
    "p_M_arr = [3] * N\n",
    "\n",
    "# Define the \"true\" psi_i functions (for data generation & regret measurement)\n",
    "psi = []\n",
    "\n",
    "if N == 8:\n",
    "    for i in range(N):\n",
    "        psi.append(lambda w, i=i: norm.cdf(3*w/(i+1)))  # using default argument to fix i\n",
    "else:\n",
    "    for i in range(N):\n",
    "        #Each psi_i is defined as norm.cdf(w - i)\n",
    "        psi.append(lambda w, i=i: norm.cdf(2*w/(i+1)))  # using default argument to fix i\n",
    "        #psi.append(lambda w, i=i: 1-np.exp(-w/(i+1)))\n",
    "\n",
    "# Define the true theta for each component\n",
    "if N ==2:\n",
    "    beta_i = 0.8\n",
    "\n",
    "if N ==4:\n",
    "    beta_i = 0.92\n",
    "\n",
    "if N ==6:\n",
    "    beta_i = 0.97\n",
    "    \n",
    "if N ==8:\n",
    "    beta_i = 0.97\n",
    "\n",
    "theta_true = []\n",
    "for i in range(N):\n",
    "    theta = np.ones(N)\n",
    "    theta[i] = -beta_i\n",
    "    # For j != i, set them to sqrt((1-beta_i^2)/(N-1))\n",
    "    for j in range(N):\n",
    "        if j != i:\n",
    "            theta[j] = np.sqrt((1-beta_i**2)/(N-1))\n",
    "    theta_true.append(theta)\n",
    "\n",
    "# Compute p* (the optimal p vector) via a fixed-point iteration\n",
    "p_initial = [p_M_arr[i] / 2 for i in range(N)]\n",
    "error = 100\n",
    "while error > 0.0001:\n",
    "    p_t = []\n",
    "    for i in range(N):\n",
    "        b_i = theta_true[i][i]\n",
    "        gamma_i = np.delete(theta_true[i], i)\n",
    "        p_minus_i = np.delete(p_initial, i)\n",
    "        q_i = p_minus_i @ gamma_i\n",
    "        p_t.append(p_opt(psi[i], b_i, q_i, p_m_arr[i], p_M_arr[i]))\n",
    "    error = np.linalg.norm(np.array(p_initial) - np.array(p_t), 2)\n",
    "    #print(\"Fixed-point error:\", error)\n",
    "    p_initial = p_t\n",
    "\n",
    "p_star = p_initial  # optimal p vector\n",
    "print(p_star)\n",
    "#p_star = [-1/theta_true[i][i] for n in range(N)]\n",
    "\n",
    "print(f\"\\nRunning experiments for N = {2} beta_i = {beta_i}\")\n",
    "\n",
    "mean_theta_diffs = []\n",
    "ci_theta_diffs = []\n",
    "mean_p_diffs = []\n",
    "ci_p_diffs = []\n",
    "mean_regrets = []\n",
    "ci_regrets = []\n",
    "mean_l2_errors = []\n",
    "ci_l2_errors = []\n",
    "\n",
    "for T in T_values:\n",
    "    print(f\"\\nRunning experiments for T = {T}\")\n",
    "    seeds = rng_master.integers(1_000_000, size=num_runs)\n",
    "    if run_parallel == True:\n",
    "        results = Parallel(n_jobs=-1)(\n",
    "            delayed(single_run_experiment)(T, N, seed, p_m_arr, p_M_arr, psi, theta_true, p_star, p_initial)\n",
    "            for seed in tqdm(seeds, desc=f\"Repetitions for T={T}\", leave=False)\n",
    "        )\n",
    "    else:\n",
    "        results = []\n",
    "        for seed in seeds:\n",
    "            results.append(single_run_experiment(T, seed))\n",
    "    \n",
    "    run_theta_diffs = np.array([r[0] for r in results])\n",
    "    run_l2_errors   = np.array([r[1] for r in results])\n",
    "    run_p_diffs     = np.array([r[2] for r in results])\n",
    "    run_total_regret= np.array([r[3] for r in results])\n",
    "    \n",
    "    def mean_ci(a):\n",
    "        m = np.nanmean(a)\n",
    "        s = np.nanstd(a, ddof=1)\n",
    "        c = 1.96 * s / np.sqrt(num_runs)\n",
    "        return m, c\n",
    "\n",
    "    mean_theta, ci_theta = mean_ci(run_theta_diffs)\n",
    "    mean_p,     ci_p     = mean_ci(run_p_diffs)\n",
    "    mean_r,     ci_r     = mean_ci(run_total_regret)\n",
    "    mean_l2,    ci_l2    = mean_ci(run_l2_errors)\n",
    "    \n",
    "    mean_theta_diffs.append(mean_theta)\n",
    "    ci_theta_diffs.append(ci_theta)\n",
    "    mean_p_diffs.append(mean_p)\n",
    "    ci_p_diffs.append(ci_p)\n",
    "    mean_regrets.append(mean_r)\n",
    "    ci_regrets.append(ci_r)\n",
    "    mean_l2_errors.append(mean_l2)\n",
    "    ci_l2_errors.append(ci_l2)\n",
    "    \n",
    "    print(f\"\\n[T={T}] Results over {num_runs} runs:\")\n",
    "    print(f\"   Sum(||theta_hat - theta_true||): {mean_theta:.3f} ± {ci_theta:.3f}\")\n",
    "    print(f\"   L2 Error (Isotonic via LS): {mean_l2:.5f} ± {ci_l2:.5f}\")\n",
    "    print(f\"   ||p_T - p^*||: {mean_p:.3f} ± {ci_p:.3f}\")\n",
    "    print(f\"   Total Regret: {mean_r:.3f} ± {ci_r:.3f}\")\n",
    "\n",
    "# SAVE DATA\n",
    "data_folder = \"DATA\"\n",
    "os.makedirs(data_folder, exist_ok=True)\n",
    "\n",
    "# Save data as a CSV file\n",
    "data_file = os.path.join(data_folder, f\"data_N_{N}.csv\")\n",
    "\n",
    "# Create a DataFrame with all the relevant data\n",
    "data_df = pd.DataFrame({\n",
    "    \"T_values\": T_values,\n",
    "    \"mean_theta_diffs\": mean_theta_diffs,\n",
    "    \"ci_theta_diffs\": ci_theta_diffs,\n",
    "    \"mean_l2_errors\": mean_l2_errors,\n",
    "    \"ci_l2_errors\": ci_l2_errors,\n",
    "    \"mean_p_diffs\": mean_p_diffs,\n",
    "    \"ci_p_diffs\": ci_p_diffs,\n",
    "    \"mean_regrets\": mean_regrets,\n",
    "    \"ci_regrets\": ci_regrets\n",
    "})\n",
    "\n",
    "# Save the data\n",
    "data_df.to_csv(data_file, index=False)\n",
    "print(f\"Data saved successfully to {data_file}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "1296592d-94a9-41e2-aba6-4baa47cfa2b3",
   "metadata": {},
   "outputs": [],
   "source": [
    "plot_all()\n",
    "plot_all_slopes()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d1bf191c-23ca-4093-bb7a-3a2f39f97615",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ce72adb8-dfde-4ad5-93ff-dc330355ece0",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.4"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
