{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e6c6951b-14c0-45bc-a225-6882fb6f3c50",
   "metadata": {},
   "outputs": [],
   "source": [
    "from joblib import Parallel, delayed  # for parallelization\n",
    "from tqdm import tqdm  # for progress bars\n",
    "from utils import *"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "d9b7c3b1-10a0-4acc-bbd1-966f887e1a3a",
   "metadata": {},
   "source": [
    "# Code reproducibility instructions\n",
    "Do the following steps in order\n",
    "\n",
    "- (1) In the following chunk named \"SELLERS SIZE\", select the number of sellers N = 2. \n",
    "- (2) Run the next chunk named \"RUN SIMULATION FOR N\". \n",
    "- (3) Repet (1) and (2) with N = 4\n",
    "- (4) Repet (1) and (2) with N = 6\n",
    "- (5) Run the chunk \"Merge the 3 plots together for a ALL N\" to "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "86b7ab47-b394-42b7-b9f4-a87ba04c2eb0",
   "metadata": {},
   "outputs": [],
   "source": [
    "## SELLERS SIZE ##\n",
    "N = 2  # number of players/components N = 2, 4, or 6"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8c013bbf-777d-4c9a-9557-ac34a57c9659",
   "metadata": {},
   "outputs": [],
   "source": [
    "## RUN SIMULATION FOR N ##\n",
    "\n",
    "# Define experiment parameters\n",
    "T_values = [100, 400, 800, 1600, 3200]\n",
    "num_runs = 30  # number of repetitions per T\n",
    "rng_master = np.random.default_rng(123)  # master RNG for reproducibility\n",
    "\n",
    "run_parallel = True\n",
    "\n",
    "# Boundaries for p (for each coordinate)\n",
    "p_m_arr = [0] * N\n",
    "p_M_arr = [3] * N\n",
    "\n",
    "# Define the \"true\" psi_i functions (for data generation & regret measurement)\n",
    "psi = []\n",
    "\n",
    "for i in range(N):\n",
    "    psi.append(lambda w, i=i: norm.cdf(2*w/(i+1)))  # using default argument to fix i\n",
    "\n",
    "# Define the true theta for each component\n",
    "if N ==2:\n",
    "    beta = [0.71, 0.84, 0.97]\n",
    "\n",
    "if N ==4:\n",
    "    beta = [0.87, 0.93, 0.99]\n",
    "\n",
    "if N ==6:\n",
    "    beta = [0.92, 0.955, 0.99]\n",
    "\n",
    "for beta_i in beta:\n",
    "    mean_theta_diffs = []\n",
    "    ci_theta_diffs = []\n",
    "    mean_p_diffs = []\n",
    "    ci_p_diffs = []\n",
    "    mean_regrets = []\n",
    "    ci_regrets = []\n",
    "    mean_l2_errors = []\n",
    "    ci_l2_errors = []\n",
    "\n",
    "    print(f\"\\nRunning experiments for N = {2} beta_i = {beta_i}\")\n",
    "    theta_true = []\n",
    "    for i in range(N):\n",
    "        theta = np.ones(N)\n",
    "        theta[i] = -beta_i\n",
    "        # For j != i, set them to sqrt((1-beta_i^2)/(N-1))\n",
    "        for j in range(N):\n",
    "            if j != i:\n",
    "                theta[j] = np.sqrt((1-beta_i**2)/(N-1))\n",
    "        theta_true.append(theta)\n",
    "    \n",
    "    \n",
    "    def check_sum_abs(vector, i):\n",
    "        gamma = np.delete(vector, i)\n",
    "        sum_gamma = np.sum(np.abs(gamma))\n",
    "        beta = - vector[i]\n",
    "        return sum_gamma < beta\n",
    "    \n",
    "    #for i in range(N):\n",
    "    #    print(check_sum_abs(theta_true[i], i))\n",
    "    \n",
    "    # Compute p* (the optimal p vector) via a fixed-point iteration\n",
    "    p_initial = [p_M_arr[i] / 2 for i in range(N)]\n",
    "    error = 100\n",
    "    while error > 0.0001:\n",
    "        p_t = []\n",
    "        for i in range(N):\n",
    "            b_i = theta_true[i][i]\n",
    "            gamma_i = np.delete(theta_true[i], i)\n",
    "            p_minus_i = np.delete(p_initial, i)\n",
    "            q_i = p_minus_i @ gamma_i\n",
    "            p_t.append(p_opt(psi[i], b_i, q_i, p_m_arr[i], p_M_arr[i]))\n",
    "        error = np.linalg.norm(np.array(p_initial) - np.array(p_t), 2)\n",
    "        #print(\"Fixed-point error:\", error)\n",
    "        p_initial = p_t\n",
    "    \n",
    "    p_star = p_initial  # optimal initial p vector\n",
    "    print(\"p_star = \",p_star)\n",
    "    #p_star = [-1/theta_true[i][i] for n in range(N)]\n",
    "    \n",
    "    \n",
    "    for T in T_values:\n",
    "        print(f\"\\nRunning experiments for T = {T}, for {num_runs} independent episodes\")\n",
    "        seeds = rng_master.integers(1_000_000, size=num_runs)\n",
    "        if run_parallel == True:\n",
    "            results = Parallel(n_jobs=-1)(\n",
    "                delayed(single_run_experiment)(T, N, seed, p_m_arr, p_M_arr, psi, theta_true, p_star, p_initial)\n",
    "                for seed in tqdm(seeds, desc=f\"Repetitions for T={T}\", leave=False)\n",
    "            )\n",
    "        else:\n",
    "            results = []\n",
    "            for seed in seeds:\n",
    "                results.append(single_run_experiment(T, seed))\n",
    "        \n",
    "        run_theta_diffs = np.array([r[0] for r in results])\n",
    "        run_l2_errors   = np.array([r[1] for r in results])\n",
    "        run_p_diffs     = np.array([r[2] for r in results])\n",
    "        run_total_regret= np.array([r[3] for r in results])\n",
    "        \n",
    "        def mean_ci(a):\n",
    "            m = np.nanmean(a)\n",
    "            s = np.nanstd(a, ddof=1)\n",
    "            c = 1.96 * s / np.sqrt(num_runs)\n",
    "            return m, c\n",
    "    \n",
    "        mean_theta, ci_theta = mean_ci(run_theta_diffs)\n",
    "        mean_p,     ci_p     = mean_ci(run_p_diffs)\n",
    "        mean_r,     ci_r     = mean_ci(run_total_regret)\n",
    "        mean_l2,    ci_l2    = mean_ci(run_l2_errors)\n",
    "        \n",
    "        mean_theta_diffs.append(mean_theta)\n",
    "        ci_theta_diffs.append(ci_theta)\n",
    "        mean_p_diffs.append(mean_p)\n",
    "        ci_p_diffs.append(ci_p)\n",
    "        mean_regrets.append(mean_r)\n",
    "        ci_regrets.append(ci_r)\n",
    "        mean_l2_errors.append(mean_l2)\n",
    "        ci_l2_errors.append(ci_l2)\n",
    "        \n",
    "        print(f\"\\n[T={T}] Results over {num_runs} runs:\")\n",
    "        print(f\"   Sum(||theta_hat - theta_true||): {mean_theta:.3f} ± {ci_theta:.3f}\")\n",
    "        print(f\"   L2 Error (Isotonic via LS): {mean_l2:.5f} ± {ci_l2:.5f}\")\n",
    "        print(f\"   ||p_T - p^*||: {mean_p:.3f} ± {ci_p:.3f}\")\n",
    "        print(f\"   Total Regret: {mean_r:.3f} ± {ci_r:.3f}\")\n",
    "\n",
    "    #SAVE DATA\n",
    "    data_folder = \"DATA\"\n",
    "    os.makedirs(data_folder, exist_ok=True)\n",
    "    \n",
    "    # Save data as a CSV file\n",
    "    if N == 2:\n",
    "        if beta_i == 0.71:\n",
    "            data_file = os.path.join(data_folder, f\"data_N_{N}_L_1.csv\")\n",
    "        if beta_i == 0.84:\n",
    "            data_file = os.path.join(data_folder, f\"data_N_{N}_L_middle.csv\")\n",
    "        if beta_i == 0.97:\n",
    "            data_file = os.path.join(data_folder, f\"data_N_{N}_L_0.csv\")\n",
    "    \n",
    "    if N == 4:\n",
    "        if beta_i == 0.87:\n",
    "            data_file = os.path.join(data_folder, f\"data_N_{N}_L_1.csv\")\n",
    "        if beta_i == 0.93:\n",
    "            data_file = os.path.join(data_folder, f\"data_N_{N}_L_middle.csv\")\n",
    "        if beta_i == 0.99:\n",
    "            data_file = os.path.join(data_folder, f\"data_N_{N}_L_0.csv\")\n",
    "    \n",
    "    if N == 6:\n",
    "        if beta_i == 0.92:\n",
    "            data_file = os.path.join(data_folder, f\"data_N_{N}_L_1.csv\")\n",
    "        if beta_i == 0.955:\n",
    "            data_file = os.path.join(data_folder, f\"data_N_{N}_L_middle.csv\")\n",
    "        if beta_i == 0.99:\n",
    "            data_file = os.path.join(data_folder, f\"data_N_{N}_L_0.csv\")\n",
    "    \n",
    "    \n",
    "    # Create a DataFrame with all the relevant data\n",
    "    data_df = pd.DataFrame({\n",
    "        \"T_values\": T_values,\n",
    "        \"mean_theta_diffs\": mean_theta_diffs,\n",
    "        \"ci_theta_diffs\": ci_theta_diffs,\n",
    "        \"mean_l2_errors\": mean_l2_errors,\n",
    "        \"ci_l2_errors\": ci_l2_errors,\n",
    "        \"mean_p_diffs\": mean_p_diffs,\n",
    "        \"ci_p_diffs\": ci_p_diffs,\n",
    "        \"mean_regrets\": mean_regrets,\n",
    "        \"ci_regrets\": ci_regrets\n",
    "    })\n",
    "    \n",
    "    # Save the data\n",
    "    data_df.to_csv(data_file, index=False)\n",
    "    print(f\"Data saved successfully to {data_file}\")\n",
    "save_plot(N)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d2f3a676-6b29-4248-9fae-7263aae12a76",
   "metadata": {},
   "outputs": [],
   "source": [
    "## Merge the 3 plots together for a ALL N ##\n",
    "plot_all()\n",
    "plot_all_slopes()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7ba34f04-9e24-452a-a238-7439b7454083",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a6188f00-c96f-4825-99df-2699e4a456dd",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.4"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
