{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "ab3a73ec-dadc-4448-9219-37e8c6f159ae",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import pulp as pulp\n",
    "from pulp import *\n",
    "import gurobipy as gp\n",
    "from gurobipy import GRB\n",
    "import random\n",
    "import pickle\n",
    "from tqdm import tqdm\n",
    "from joblib import Parallel, delayed\n",
    "\n",
    "from EDDP_functions import *"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "dc2eeddc-ef79-4059-96a6-a94ff7799b3d",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6bb6a541-bb14-4958-8a58-b57362543c21",
   "metadata": {},
   "outputs": [],
   "source": [
    "def test_degeneracy(P0,P1,R0,R1,T,init,alpha):\n",
    "    # solve the LP\n",
    "    n = len(R0)\n",
    "    P = [P0,P1]\n",
    "    R = [R0,R1]\n",
    "    action = range(0,2)\n",
    "    state = range(0,n)\n",
    "    horizon = range(0,T)\n",
    "    prob = LpProblem(\"LP1\", LpMaximize)\n",
    "    variables = LpVariable.dicts(\"Y\",(horizon,action,state),lowBound=0., upBound=1.)\n",
    "    for t in horizon:\n",
    "        prob += lpSum([variables[t][1][s] for s in state]) == alpha\n",
    "    for t in range(0,T-1):\n",
    "        for s in state:\n",
    "            prob += variables[t+1][0][s] + variables[t+1][1][s] == lpSum([variables[t][a][ss]*P[a][ss][s] for a in action for ss in state])\n",
    "    for s in state:\n",
    "        prob += variables[0][0][s] + variables[0][1][s] == init[s]\n",
    "    prob += lpSum([variables[t][a][s]*R[a][s] for t in horizon for a in action for s in state])\n",
    "    prob.solve(PULP_CBC_CMD(msg=1))\n",
    "    # Test regularity\n",
    "    for t in horizon:\n",
    "        count = 0\n",
    "        for s in state:\n",
    "            V1 = variables[t][1][s]\n",
    "            V2 = variables[t][0][s]\n",
    "            v1 = V1.varValue\n",
    "            v2 = V2.varValue\n",
    "            if abs(v1) > 1e-6 and abs(v2) > 1e-6:\n",
    "                count += 1\n",
    "        if count == 0:\n",
    "            return True\n",
    "    return False\n",
    "\n",
    "def lp_check_uniqueness_gurobi(\n",
    "    P0: np.ndarray,     # shape = (S,S)\n",
    "    P1: np.ndarray,     # shape = (S,S)\n",
    "    R0: np.ndarray,     # length = S\n",
    "    R1: np.ndarray,     # length = S\n",
    "    T: int,\n",
    "    init: np.ndarray,   # length = S\n",
    "    alpha: float,\n",
    "    tol: float = 1e-6\n",
    "):\n",
    "    \"\"\"\n",
    "    Build and solve the same LP in Gurobi, then test uniqueness by\n",
    "    checking that no non-basic variable has a reduced cost near zero.\n",
    "    Returns: (y_opt, obj_val, is_unique)\n",
    "    \"\"\"\n",
    "    S = len(R0)\n",
    "    action = [0,1]\n",
    "    # --- 1) build model\n",
    "    m = gp.Model()\n",
    "    m.Params.OutputFlag = 0\n",
    "    # tighten tolerances\n",
    "    m.Params.FeasibilityTol = tol\n",
    "    m.Params.OptimalityTol  = tol\n",
    "\n",
    "    # variables y[t,a,s]\n",
    "    Y = {}\n",
    "    for t in range(T):\n",
    "        for a in action:\n",
    "            for s in range(S):\n",
    "                Y[t,a,s] = m.addVar(lb=0.0, ub=1.0, name=f\"Y_{t}_{a}_{s}\")\n",
    "    m.update()\n",
    "\n",
    "    # 2) add budget constraints\n",
    "    for t in range(T):\n",
    "        m.addLConstr(\n",
    "            gp.quicksum(Y[t,1,s] for s in range(S)) == alpha,\n",
    "            name=f\"budget_{t}\"\n",
    "        )\n",
    "\n",
    "    # 3) transitions\n",
    "    for t in range(T-1):\n",
    "        for s in range(S):\n",
    "            m.addLConstr(\n",
    "                gp.quicksum(Y[t+1,a,s] for a in action)\n",
    "              - gp.quicksum(Y[t,a,ss] * (P1[ss,s] if a==1 else P0[ss,s])\n",
    "                            for a in action for ss in range(S))\n",
    "              == 0,\n",
    "                name=f\"trans_{t}_{s}\"\n",
    "            )\n",
    "\n",
    "    # 4) initial\n",
    "    for s in range(S):\n",
    "        m.addLConstr(\n",
    "            gp.quicksum(Y[0,a,s] for a in action) == init[s],\n",
    "            name=f\"init_{s}\"\n",
    "        )\n",
    "\n",
    "    # 5) objective\n",
    "    obj = gp.quicksum(\n",
    "        Y[t,a,s] * (R1[s] if a==1 else R0[s])\n",
    "        for t in range(T) for a in action for s in range(S)\n",
    "    )\n",
    "    m.setObjective(obj, GRB.MAXIMIZE)\n",
    "\n",
    "    # 6) solve\n",
    "    m.optimize()\n",
    "\n",
    "    if m.status != GRB.OPTIMAL:\n",
    "        raise RuntimeError(\"LP did not solve to optimality\")\n",
    "\n",
    "    # 7) extract solution\n",
    "    y_opt = np.zeros((T,2,S))\n",
    "    for (t,a,s), var in Y.items():\n",
    "        y_opt[t,a,s] = var.X\n",
    "\n",
    "    z_opt = m.ObjVal\n",
    "\n",
    "    # 8) test uniqueness: scan non‑basic variables\n",
    "    is_unique = True\n",
    "    for (t,a,s), var in Y.items():\n",
    "        if var.VBasis != GRB.BASIC:          # only check non‑basics\n",
    "            if abs(var.RC) < tol:            # reduced cost near zero\n",
    "                is_unique = False\n",
    "                break\n",
    "\n",
    "    return y_opt, z_opt, is_unique"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "9a53b8f7-3075-494c-b845-2e70aff60e11",
   "metadata": {},
   "source": [
    "Fully dense"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "92d52659-7920-4aff-9c98-52b533ea1f42",
   "metadata": {},
   "outputs": [],
   "source": [
    "T = 10\n",
    "time_homogenous = True\n",
    "sparse =  False\n",
    "tol = 1e-6\n",
    "myS = np.arange(5,25,5)\n",
    "\n",
    "for S in myS:\n",
    "    uniqueness_count = 0\n",
    "    degenerate_count = 0\n",
    "    d = int(S/2)\n",
    "    for _ in tqdm(range(10000)):\n",
    "        P_list, r_list, alpha_budget, init = generate_problem_data(T, S, time_homogenous, sparse, d)\n",
    "\n",
    "        P_array = np.zeros((T, S, S, 2))\n",
    "        for t in range(T):\n",
    "            P_0 = P_list[t][0]\n",
    "            P_1 = P_list[t][1]\n",
    "            P_array[t,:,:,0] = P_0\n",
    "            P_array[t,:,:,1] = P_1\n",
    "        r_array = np.zeros((T, 2*S))\n",
    "        for t_ in range(T):\n",
    "            r_array[t_,:] = r_list[t_]\n",
    "      \n",
    "        P0 = P_list[0][0]\n",
    "        P1 = P_list[0][1]\n",
    "        R0 = np.zeros(S)\n",
    "        R1 = np.zeros(S)\n",
    "        for s in range(S):\n",
    "            R0[s] = r_list[0][2*s]\n",
    "            R1[s] = r_list[0][2*s+1]\n",
    "        alpha = alpha_budget[0]\n",
    "        is_degenerate = test_degeneracy(P0, P1, R0, R1, T, init, alpha)\n",
    "        \n",
    "        is_unique = lp_check_uniqueness_gurobi(P0, P1, R0, R1, T, init, alpha, tol)[2]\n",
    "        \n",
    "        if is_unique:\n",
    "            uniqueness_count += 1\n",
    "        if is_degenerate:\n",
    "            degenerate_count += 1\n",
    "        \n",
    "    print(f\"S = {S} and sparse = {sparse}:\")\n",
    "    print(f\"uniqueness_count is {uniqueness_count} out of 10000\")\n",
    "    print(f\"degenerate_count is {degenerate_count} out of 10000\")\n"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "342da6dc-ec1e-4a24-9b4a-2fa38070ac0e",
   "metadata": {},
   "source": [
    "Half sparse"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "33d00a52-05eb-456a-8dea-446eb6b0a4f3",
   "metadata": {},
   "outputs": [],
   "source": [
    "T = 10\n",
    "time_homogenous = True\n",
    "sparse =  True\n",
    "tol = 1e-6\n",
    "myS = np.arange(5,25,5)\n",
    "\n",
    "for S in myS:\n",
    "    uniqueness_count = 0\n",
    "    degenerate_count = 0\n",
    "    d = int(S/2)\n",
    "    for _ in tqdm(range(10000)):\n",
    "        P_list, r_list, alpha_budget, init = generate_problem_data(T, S, time_homogenous, sparse, d)\n",
    "\n",
    "        P_array = np.zeros((T, S, S, 2))\n",
    "        for t in range(T):\n",
    "            P_0 = P_list[t][0]\n",
    "            P_1 = P_list[t][1]\n",
    "            P_array[t,:,:,0] = P_0\n",
    "            P_array[t,:,:,1] = P_1\n",
    "        r_array = np.zeros((T, 2*S))\n",
    "        for t_ in range(T):\n",
    "            r_array[t_,:] = r_list[t_]\n",
    "      \n",
    "        P0 = P_list[0][0]\n",
    "        P1 = P_list[0][1]\n",
    "        R0 = np.zeros(S)\n",
    "        R1 = np.zeros(S)\n",
    "        for s in range(S):\n",
    "            R0[s] = r_list[0][2*s]\n",
    "            R1[s] = r_list[0][2*s+1]\n",
    "        alpha = alpha_budget[0]\n",
    "        is_degenerate = test_degeneracy(P0, P1, R0, R1, T, init, alpha)\n",
    "        \n",
    "        is_unique = lp_check_uniqueness_gurobi(P0, P1, R0, R1, T, init, alpha, tol)[2]\n",
    "        \n",
    "        if is_unique:\n",
    "            uniqueness_count += 1\n",
    "        if is_degenerate:\n",
    "            degenerate_count += 1\n",
    "        \n",
    "    print(f\"S = {S} and sparse = {sparse}:\")\n",
    "    print(f\"uniqueness_count is {uniqueness_count} out of 10000\")\n",
    "    print(f\"degenerate_count is {degenerate_count} out of 10000\")\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
