{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "0a0d7513",
   "metadata": {},
   "source": [
    "<a id=\"Leaky ReLU\"></a>\n",
    "\n",
    "## Stochasitc Leaky ReLU regression\n",
    "\n",
    "\n",
    "<p>\n",
    "$$ \\frac{1}{2}   \\sum_{i=1} \\left( \\sigma( w^\\top x_i )  - y_i     \\right)^2, $$\n",
    "</p>\n",
    "where $\\sigma(z) = \\max( \\alpha z, z )$ with $1 > \\alpha > 0$ the Leaky ReLU. It is assumed that there exists a $w_* \\in \\mathcal{R}^d$ such that $y_i = \\langle w_* , x_i \\rangle$.\n",
    "ReLU is the case when $\\alpha=0$."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "62372a47",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import time\n",
    "import myHSS\n",
    "import matplotlib\n",
    "import matplotlib.pyplot as plt\n",
    "kwargs = {'linewidth' : 7.0}\n",
    "font = {'weight' : 'normal',\n",
    "        'size'   : 28}\n",
    "matplotlib.rc('font', **font)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6371e535",
   "metadata": {},
   "outputs": [],
   "source": [
    "def LeakyReLU_subgradient(z, alpha=0.1):\n",
    "    g = np.ones(z.shape)\n",
    "    g[z < 0] = alpha\n",
    "    return g\n",
    "\n",
    "def LReLU(z,alpha=0.1):\n",
    "    return np.maximum( z, alpha*z )\n",
    "\n",
    "def LeakyReLU_fval(A, y, w, num, alpha=0.1):\n",
    "    # A is a data matrix, y is a vector of labels\n",
    "    Aw = np.dot(A,w)\n",
    "    return np.sum( (LReLU(Aw, alpha) - y  )**2 ) / num\n",
    "\n",
    "def LeakyReLUopt_grad(A, y, w, num, alpha=0.1):\n",
    "    #randomly computes a stochastic pseudo gradient\n",
    "    idd = np.random.randint(num)\n",
    "    return ( LReLU( np.dot( A[idd,] , w ) ) - y[idd] ) * A[idd,:].T \n",
    "\n",
    "def LeakyReLU(w, func_only=False, grad_only=False):\n",
    "    alpha = 0.1\n",
    "    if (func_only == True):\n",
    "        return LeakyReLU_fval(A,y,w,num,alpha)\n",
    "    if (grad_only)== True:\n",
    "        return LeakyReLUopt_grad(A, y, w, num, alpha)\n",
    "    return LeakyReLU_fval(A,y,w, num, alpha), LeakyReLUopt_grad(A, y, w, num, alpha)\n",
    "\n",
    "\n",
    "def GDupdate(wold, eta, grad):\n",
    "    w = wold - eta*grad\n",
    "    return w\n",
    "\n",
    "num, d  = 1000, 50\n",
    "A     = np.random.normal(0, 1, (num,d) )\n",
    "wstar = np.random.normal(0, 1, d)\n",
    "y     = LReLU( np.dot(A,wstar)) \n",
    "#############################################################\n",
    "w_init = (10**-2)*np.random.normal(0, 1, d)\n",
    "iters = 20000\n",
    "#------------------------------------------------------------\n",
    "#perform GD\n",
    "eta_candi   = [10**-2]\n",
    "dist_arrGD  = np.zeros([len(eta_candi), iters+1])\n",
    "cpu_arrGD   = np.zeros([len(eta_candi), iters+1])\n",
    "w_GD = w_init\n",
    "\n",
    "for q in range(len(eta_candi)):\n",
    "    eta = eta_candi[q]\n",
    "    elarpsed = 0\n",
    "    dist_arrGD[q,0] = np.linalg.norm(w_GD-wstar)\n",
    "    cpu_arrGD[q,0]  = elarpsed\n",
    "    for i in range(iters):\n",
    "        start = time.time()\n",
    "        w_GD = GDupdate(w_GD, eta, LeakyReLUopt_grad(A,y,w_GD,num) )\n",
    "        dist_arrGD[q,i+1] = np.linalg.norm(w_GD-wstar)\n",
    "        elarpsed += time.time() - start\n",
    "        cpu_arrGD[q,i+1]  = elarpsed                \n",
    "#########################################################\n",
    "idd_GD = np.argmin( dist_arrGD[:,iters] ) \n",
    "print('=== idd_GD:', idd_GD)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d7c62a31",
   "metadata": {},
   "outputs": [],
   "source": [
    "def Continuizedupdate(v, w, z, rho, mu, L, A, y, num):\n",
    "    gamma  =  1./L\n",
    "    gamma1 =  1./np.sqrt(mu*L) \n",
    "    sta    =  np.exp( -(1.+rho)* np.sqrt( mu/L )* np.random.exponential(1,1)  )\n",
    "    tau    =  1./(1+rho)*(1. - sta )\n",
    "    tau1   =  rho*(1.- sta) / (rho + sta)\n",
    "\n",
    "    v1 = w + tau*( z - w)  \n",
    "    grad = LeakyReLUopt_grad(A,y,v1,num)\n",
    "    w1  = v1 - gamma*grad\n",
    "    z1  = z  + tau1*(v1-z) - gamma1 * grad\n",
    "    return v1, w1, z1\n",
    "#----------------------------------------------------------------------------\n",
    "L_candi    = [100]  # \\tilde{\\kappa} R^2 in Theorem 3     \n",
    "mu_candi   = [10]   \n",
    "rho_candi  = [1]    # as \\eta = \\eta' in Theorem 3\n",
    "#-------------------------------------------------------------------------\n",
    "runs = 10\n",
    "dist_arrConti  = np.zeros( [len(L_candi), iters+1, runs] )\n",
    "cpu_arrConti   = np.zeros( [len(L_candi), iters+1, runs] )\n",
    "for q in range(len(L_candi)):\n",
    "    print(\"q\",q)\n",
    "    L   =  L_candi[q]\n",
    "    mu  = mu_candi[q]\n",
    "    rho =rho_candi[q]\n",
    "    for r in range(runs):\n",
    "        v_Conti   = w_init\n",
    "        w_Conti   = w_init\n",
    "        z_Conti   = w_init\n",
    "        elarpsed = 0\n",
    "        dist_arrConti[q,0,r] = np.linalg.norm(w_Conti-wstar)\n",
    "        cpu_arrConti[q,0,r]  = elarpsed\n",
    "        for i in range(iters):\n",
    "            start = time.time()\n",
    "            v_Conti, w_Conti, z_Conti = Continuizedupdate(v_Conti,w_Conti,z_Conti,rho,mu,L,A,y,num)\n",
    "            dist_arrConti[q,i+1,r] = np.linalg.norm(w_Conti-wstar)\n",
    "            elarpsed += time.time() - start\n",
    "            cpu_arrConti[q,i+1,r]  = elarpsed                \n",
    "dist_Conti_mean = np.mean( dist_arrConti, axis=2 )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b0e8f97c",
   "metadata": {},
   "outputs": [],
   "source": [
    "idd_conti = np.argmin( dist_Conti_mean[:,iters] ) \n",
    "print('=== idd_conti:', idd_conti)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "0fb0caad",
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "\n",
    "shows = 16000\n",
    "ts = np.arange( shows )\n",
    "print(ts.shape)\n",
    "#'-', '--', '-.', ':', '',\n",
    "plt.figure(figsize=(14, 8))\n",
    "plt.title('distance v.s. iteration')\n",
    "texa = \"Stochastic GLMtron\"\n",
    "plt.yscale( 'log' ) \n",
    "plt.plot(ts, dist_arrGD[idd_GD,:shows], 'r-', label= texa, linestyle='--', **kwargs)\n",
    "#=============================================================================\n",
    "#compute mean and std\n",
    "dist_Conti_mean = np.mean( dist_arrConti, axis=2 )\n",
    "dist_Conti_std  = np.std( dist_arrConti, axis=2 )\n",
    "texb = \"Acc. Stochastic GLMtron\"\n",
    "plt.plot(ts, dist_Conti_mean[idd_conti,:shows], 'g-', label= texb, linestyle='-', **kwargs)\n",
    "plt.fill_between(ts, dist_Conti_mean[idd_conti,:shows], dist_Conti_mean[idd_conti,:shows] + dist_Conti_std[idd_conti,:shows], color='gray', alpha=0.2)\n",
    "plt.xlim([0,13000])\n",
    "\n",
    "plt.legend()\n",
    "plt.ylabel('distance')\n",
    "plt.xlabel('iteration')\n",
    "\n",
    "myname = \"Stochastic01\"\n",
    "hi = \"./figures/\" + myname + \"_iters.jpg\"\n",
    "plt.savefig(hi)\n",
    "\n",
    "plt.show();\n",
    "\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
