{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "e29b8992",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import pandas as pd\n",
    "from sklearn.linear_model import LinearRegression\n",
    "import seaborn as sns\n",
    "import matplotlib.pyplot as plt\n",
    "import numpy as np\n",
    "from scipy.stats import norm\n",
    "import pandas as pd\n",
    "import scipy\n",
    "from scipy.stats import chi2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "165d003c",
   "metadata": {},
   "outputs": [],
   "source": [
    "# define reward function\n",
    "def get_noise():\n",
    "    return  np.random.poisson(1,1)[0] - 1\n",
    "\n",
    "\n",
    "def get_unitv(d):\n",
    "    # generate unit vector in sphere\n",
    "    x = np.random.normal(0,1,d)\n",
    "    return x/np.linalg.norm(x)\n",
    "\n",
    "def get_Actions(num,d):\n",
    "    return np.array([get_unitv(d) for i in range(num)])\n",
    "    \n",
    "\n",
    "# stochastic regression\n",
    "def ECB(n, Actions):\n",
    "    d = Actions.shape[1]\n",
    "    initial_run = Actions.shape[0]\n",
    "    theta = np.array([0.3]*d).reshape(-1,1)\n",
    "    \n",
    "    # data matrix\n",
    "    X = Actions.copy()\n",
    "    \n",
    "    # contextual bandits - action set\n",
    "    y = X@theta + np.array([get_noise() for i in range(initial_run)]).reshape(-1,1)\n",
    "    \n",
    "    y = y.reshape(-1)\n",
    "    nums = np.ones(initial_run)\n",
    "    rewards = y.copy().reshape(-1)\n",
    "    \n",
    "    for i in range(n-initial_run):\n",
    "        arm_means = rewards/nums\n",
    "        arm = np.argmax(arm_means)\n",
    "        # defining decaying rate\n",
    "        flag = np.random.uniform(0,1,1)[0]\n",
    "        if flag > np.log(i+1)**2/(i+1) and i > 50:\n",
    "            arm = np.random.randint(1,1+ initial_run) - 1\n",
    "        \n",
    "        # append new observation\n",
    "        newx = Actions[arm,:]\n",
    "        X = np.append(X, newx.reshape(1,-1), axis = 0 )\n",
    "        newr = np.sum(newx*0.3)  + get_noise()\n",
    "        y = np.append(y, newr)\n",
    "        \n",
    "    return X, y"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "b7c1085d",
   "metadata": {},
   "source": [
    "## $\\Sigma_0 = \\log(n)$"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "dcb9104e",
   "metadata": {},
   "outputs": [],
   "source": [
    "def Volumn(V):\n",
    "    # given a matrix V, compute the volumn correspoing to the ellipse of the format x^T V x \\leq 1\n",
    "    # universal constant are dropped\n",
    "    s =  np.linalg.svd(V)[1]\n",
    "    return 1/np.product(np.sqrt(s))\n",
    "\n",
    "\n",
    "\n",
    "def scaled_estimators(n, Actions, wlam, clam, sampler, alpha_list): # need to add lambda as tuning parameter here. \n",
    "    \n",
    "    d = Actions.shape[1]\n",
    "    # consider confidence level \n",
    "    siglevel = 1 - alpha_list \n",
    "    siglevelLen = np.size(siglevel)\n",
    "    cql = chi2.ppf(siglevel, d)\n",
    "    \n",
    "    true_theta = np.array([0.3]*d).reshape(-1,1)\n",
    "    CI_data = np.zeros((2, siglevelLen * 4 )) # KK -- first row is coverage and second row is volume. Times 4 means 4 methods\n",
    "    # OLS, W decor, concentration and ALEE (asymptotic) ? \n",
    "    \n",
    "    X,y = sampler(n, Actions)\n",
    "    #######################################\n",
    "    # compute OLS\n",
    "    M = LinearRegression(fit_intercept = False).fit(X, y)\n",
    "    coeff = M.coef_.copy().reshape(-1,1)\n",
    "    Sn = X.T@X\n",
    "    residual = y.reshape(-1,1) - X@coeff\n",
    "    # compute residual and use it as an estimate of sigma^2\n",
    "    sig_h = np.sqrt(np.mean(residual**2))\n",
    "    \n",
    "    c = 1/sig_h**2*(coeff.reshape(1,-1)- true_theta.reshape(1,-1))@Sn@(coeff - true_theta)\n",
    "    c = c.reshape(-1)[0]\n",
    "\n",
    "    ## KK -- what does this part of code do?\n",
    "    \n",
    "    for i in range(siglevelLen): # KK --  3 -- is the number of significance level ?\n",
    "        cq = cql[i]\n",
    "        cover = c < cq - 0\n",
    "        v = Volumn(Sn/sig_h**2/cq)\n",
    "        v = np.log(v)\n",
    "        CI_data[:,0 + 4*i] = np.array([cover, v]).reshape(-1)  # KK -- coverage values grouped by significance levels \n",
    "     \n",
    "    #######################################\n",
    "    # W-decorrelation\n",
    "    W_lambdas = np.ones(n)*wlam\n",
    "    wols = M.coef_.copy().reshape(-1)\n",
    "    w = np.zeros((d,1))\n",
    "    WX = np.zeros((d,d))\n",
    "    W = np.zeros_like(X)\n",
    "    for t in range(n):\n",
    "        w = (np.eye(d) - WX)@X[t,:].reshape(-1,1) \n",
    "        w = w/(np.sum(X[t,:]**2) + W_lambdas[t])\n",
    "        W[t, :] = w.reshape(-1)\n",
    "        wols += w.reshape(-1) * (y[t] - np.sum(X[t,:]*coeff.reshape(-1)) ) \n",
    "        WX = WX + w@X[t,:].reshape(1,-1)\n",
    "        \n",
    "    WW = np.linalg.inv(W.T@W)\n",
    "   \n",
    "    # compute statistic\n",
    "    c = 1/sig_h**2*(wols - true_theta.reshape(1,-1))@WW@(wols.reshape(-1,1) - true_theta)\n",
    "    c = c.reshape(-1)[0]\n",
    "    for i in range(siglevelLen):    ## KK -- same comment here, is 3 the number of target coverage level? \n",
    "        cq = cql[i]\n",
    "        cover = c < cq - 0\n",
    "        v = Volumn(WW/sig_h**2/cq)\n",
    "        v = np.log(v)\n",
    "        CI_data[:,1 + 4*i] = np.array([cover, v]).reshape(-1)  # coverage grouped by significance levels\n",
    "    \n",
    "   \n",
    "    \n",
    "    ######################################\n",
    "    #  Modified ALEE - log(n) # Sigma_0 = log_n hard encoded. \n",
    "    Z = np.zeros_like(X)\n",
    "    Sigma0 = np.log(n)**0.5*np.eye(d)\n",
    "    for t in range(n):\n",
    "        if t == 0:\n",
    "            S = Sigma0\n",
    "        else:\n",
    "            S = Sigma0 + X[:t,:].T@X[:t,:]\n",
    "        \n",
    "        svd_u, svd_s, svd_v = np.linalg.svd(S, full_matrices=True)\n",
    "        \n",
    "        S_invh = svd_u@np.diag(svd_s**(-0.5))@svd_v\n",
    "\n",
    "        zt = S_invh@X[t,:].reshape(-1,1)\n",
    "        \n",
    "        Z[t,:] = zt.reshape(-1)\n",
    "    \n",
    "    \n",
    "    W = np.zeros_like(Z)\n",
    "    vt = np.eye(d)\n",
    "    for i in range(n):\n",
    "        # zi\n",
    "        z = Z[i,:].reshape(1,-1)\n",
    "        vtt = vt.copy()\n",
    "        term_deno = 1 + z@vtt@z.T\n",
    "        term_deno = term_deno.reshape(-1)[0]\n",
    "        \n",
    "        # update\n",
    "        vt = vtt - vtt@z.T@z@vtt/term_deno\n",
    "        w = np.sqrt(term_deno)*vt@z.T\n",
    "\n",
    "        W[i,:] = w.reshape(-1)\n",
    "        \n",
    "    \n",
    "    ######### design new Zt\n",
    "    kappa = np.log(n)\n",
    "    tau = np.exp(1)*np.sqrt(np.log(n))\n",
    "    Z1 = np.copy(Z)\n",
    "    Vn_inv = np.eye(d) + Z1.T@Z1\n",
    "    evalues, evectors = np.linalg.eig(Vn_inv)\n",
    "    \n",
    "    addn = 0\n",
    "    # construct new Z\n",
    "    for i in range(d):\n",
    "        if evalues[i] < kappa:\n",
    "            dn = int((kappa - evalues[i])*tau)\n",
    "            addn = addn + dn\n",
    "            Z1 = np.concatenate((Z1, np.tile(evectors[:,i], (dn,1))/tau), axis = 0)\n",
    "    \n",
    "    \n",
    "    addW = np.zeros((addn,d))\n",
    "    \n",
    "    for i in range(addn):\n",
    "        z = Z1[i+n,:].reshape(1,-1)\n",
    "        vtt = vt.copy()\n",
    "        term_deno = 1 + z@vtt@z.T\n",
    "        term_deno = term_deno.reshape(-1)[0]\n",
    "        \n",
    "        # update\n",
    "        vt = vtt - vtt@z.T@z@vtt/term_deno\n",
    "        w = np.sqrt(term_deno)*vt@z.T\n",
    "        \n",
    "        addW[i,:] = w.reshape(-1)\n",
    "    \n",
    "    # simulate gaussian random variable\n",
    "    new_error = np.random.normal(0, sig_h, addn).reshape(-1,1)\n",
    "    \n",
    "    # design new estimator\n",
    "    A = W.T@X\n",
    "    alee = np.linalg.inv(A)@(W.T@y.reshape(-1,1) + addW.T@new_error)\n",
    "    \n",
    "    \n",
    "    OSn = A.T@A\n",
    "    \n",
    "    c = 1/sig_h**2*(alee.reshape(1,-1)- true_theta.reshape(1,-1))@OSn@(alee - true_theta)\n",
    "    c = c.reshape(-1)[0]\n",
    "    for i in range(siglevelLen):\n",
    "        cq = cql[i]\n",
    "        cover = c < cq - 0\n",
    "        \n",
    "        v = Volumn(OSn/sig_h**2/cq)\n",
    "        v = np.log(v)\n",
    "        CI_data[:,2 + 4*i] = np.array([cover, v]).reshape(-1)  # grouped by significance level.\n",
    "\n",
    "    \n",
    "  \n",
    "    \n",
    "    ######################################\n",
    "    # ridge concentration\n",
    "    # set S\n",
    "    S = np.sqrt(d)\n",
    "    rols = np.linalg.inv(X.T@X + clam*np.eye(d))@X.T@y.reshape(-1,1)\n",
    "\n",
    "    # Adding lambdaPar value - clam\n",
    "    Vt = clam * np.eye(d) + Sn\n",
    "\n",
    "    \n",
    "    delta_list = alpha_list.copy()\n",
    "    \n",
    "    c = (rols.reshape(1,-1) - true_theta.reshape(1,-1))@Vt@(rols - true_theta)\n",
    "    c = c.reshape(-1)[0]\n",
    "    \n",
    "    for i in range(siglevelLen):\n",
    "        delta = delta_list[i]\n",
    "        ## Needs to be checked \n",
    "        cq = sig_h*np.sqrt(np.log(np.linalg.det(Vt)/delta**2) - d*np.log(clam)) + np.sqrt(clam)*S \n",
    "        # lambda = 1 and S = |thetastar| \\leq 2   \n",
    "        cover = c < cq**2 - 0\n",
    "        v = Volumn(Vt/cq**2)\n",
    "        v = np.log(v)\n",
    "        CI_data[:,3 + 4*i] = np.array([cover, v]).reshape(-1)\n",
    "    \n",
    "\n",
    "    return CI_data\n",
    "    \n",
    "    \n",
    "    \n",
    "#   replication function\n",
    "# need to change this part to accomodate siglevels \n",
    "# N -- number of replications \n",
    "# n -- sample size \n",
    "\n",
    "def ACV_repli(N , n, Actions, wlam, clam,  sampler, alpha_list):\n",
    "    nalpha = np.size(alpha_list)\n",
    "    \n",
    "    E = np.zeros((nalpha, N, 8))\n",
    "    \n",
    "    for i in range(N):\n",
    "        print(i)\n",
    "        output = scaled_estimators(n, Actions, wlam, clam, sampler, alpha_list)\n",
    "        for k in range(nalpha):\n",
    "            E[k,i,:] = output[:,(4*k):(4*k+4)].reshape(1,8)\n",
    "        \n",
    "    return E"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "359d097e",
   "metadata": {},
   "outputs": [],
   "source": [
    "# This is for W-decorrelaton lambda stuff. \n",
    "\n",
    "def compute_lam(N, n, sampler, Actions):\n",
    "    \n",
    "    record = np.zeros(N)\n",
    "    for k in range(N):\n",
    "        \n",
    "        X,y = sampler(n,Actions)\n",
    "\n",
    "        evalue, evector = np.linalg.eig(X.T@X)\n",
    "        \n",
    "        record[k] = np.min(evalue)\n",
    "        \n",
    "    return np.percentile(record, 10)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "9fc05ff0",
   "metadata": {},
   "outputs": [],
   "source": [
    "np.random.seed(517)\n",
    "Actions = get_Actions(60, 50)\n",
    "# first input is the number of actions and second one is dimension.\n",
    "\n",
    "np.random.seed(517)\n",
    "# compute_lam(N, n, sampler, Actions) \n",
    "wlam = compute_lam(1000, 1000, ECB, Actions)/np.log(1000) # this is for W decorrelation "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "bafb83a7",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0\n",
      "1\n",
      "2\n",
      "3\n",
      "4\n",
      "5\n",
      "6\n",
      "7\n",
      "8\n",
      "9\n",
      "10\n"
     ]
    }
   ],
   "source": [
    "np.random.seed(517)\n",
    "Actions = get_Actions(60, 50)\n",
    "\n",
    "np.random.seed(517)\n",
    "alpha_list = np.array([0.2, 0.15,0.1])\n",
    "E = ACV_repli(1000, 1000, Actions, wlam, clam = 0.01, sampler = ECB, alpha_list=  alpha_list )"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "7632462b",
   "metadata": {},
   "source": [
    "# Confidence level first one"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "97abdc18",
   "metadata": {},
   "outputs": [],
   "source": [
    "df = pd.DataFrame(np.mean(E[0,:,:], axis = 0).reshape(2,4), columns = ['ols','W', 'ALEE-logn', 'Concentration'])\n",
    "round(df,3)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "bed1a1be",
   "metadata": {},
   "outputs": [],
   "source": [
    "df = pd.DataFrame(np.std(E[0,:,:], axis = 0).reshape(2,4), columns = ['ols','W', 'ALEE-logn', 'Concentration'])\n",
    "round(df,3)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "28b1f83c",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "987edb67",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "65f06edb",
   "metadata": {},
   "outputs": [],
   "source": [
    "df = pd.DataFrame(np.mean(E[1,:,:], axis = 0).reshape(2,4), columns = ['OLS','W', 'ALEE-logn', 'Concentration'])\n",
    "round(df,3)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "34cb2eb6",
   "metadata": {},
   "outputs": [],
   "source": [
    "df = pd.DataFrame(np.std(E[1,:,:], axis = 0).reshape(2,4), columns = ['OLS','W', 'ALEE-logn', 'Concentration'])\n",
    "round(df,3)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "10282637",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "26dde673",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "60cbe407",
   "metadata": {},
   "outputs": [],
   "source": [
    "df = pd.DataFrame(np.mean(E[2,:,:], axis = 0).reshape(2,4), columns = ['ols','W', 'ALEE-logn', 'Concentration'])\n",
    "round(df,3)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e9fd9fa7",
   "metadata": {},
   "outputs": [],
   "source": [
    "df = pd.DataFrame(np.std(E[2,:,:], axis = 0).reshape(2,4), columns = ['OLS','W', 'ALEE-logn', 'Concentration'])\n",
    "round(df,3)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
