{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "goX9NsKXGU0z"
   },
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "7GVWcjh65iGv"
   },
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "%config InlineBackend.figure_formats = ['svg']\n",
    "from scipy.linalg import sqrtm\n",
    "from numpy import linalg as LA\n",
    "\n",
    "plt.rcParams.update({'font.size': 14})\n",
    "plt.rcParams[\"figure.figsize\"] = (7,5)\n",
    "import seaborn as sns\n",
    "colors = sns.color_palette(\"colorblind\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Dash patterns for the line plots, passed to matplotlib via the `dashes=` keyword.\n",
    "# Each tuple alternates (on, off, on, off, ...) segment lengths; the trailing\n",
    "# comment on every entry is only an informal name for the pattern.\n",
    "custom_dashes = [\n",
    "    (1, 0),           # Solid\n",
    "    (1, 1),           # Dotted\n",
    "    (4, 2),           # Dashed\n",
    "    (3, 2, 1, 2),     # Dash-Dot\n",
    "    (5, 2, 1, 2, 1, 2),  # Dash-Dot-Dot\n",
    "    (8, 2),           # Long Dashes\n",
    "    (2, 4),           # Loosely Dashed\n",
    "    (5, 4, 1, 4),     # Sparse Dash-Dot\n",
    "    (6, 4, 1, 4, 1, 4),  # Sparse Dash-Dot-Dot\n",
    "    (1, 4),           # Loosely Dotted\n",
    "    (4, 2, 1, 2, 1, 2),  # Dashed with Dots\n",
    "    (2, 4, 1, 4, 2, 4)   # Custom Pattern 1\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "9iedPQJn5jvq"
   },
   "outputs": [],
   "source": [
    "def cost(x):\n",
    "  \"\"\"Evaluate the objective at the point ``x``.\n",
    "\n",
    "  Adds a quadratic form in the global matrix ``H`` to a quartic term and\n",
    "  subtracts a cubic term, both weighted by the global coefficient ``landa``.\n",
    "  \"\"\"\n",
    "  quadratic = 0.5*x.T@H@x\n",
    "  quartic = 0.25*landa*(np.sum(x**4))\n",
    "  cubic = 0.1*(1/3)*landa*(np.sum(x**3))\n",
    "  return quadratic + quartic - cubic\n",
    "\n",
    "def g(x):\n",
    "  \"\"\"Return ``H@x + landa*x**3 - 0.1*landa*x**2``, the gradient of ``cost`` when ``H`` is symmetric.\"\"\"\n",
    "  linear = H@x\n",
    "  cubic = landa*x**3\n",
    "  quadratic = 0.1*landa*x**2\n",
    "  return linear + cubic - quadratic"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "oVZOW6-UeAee"
   },
   "outputs": [],
   "source": [
    "def Algo_Traj(eta, x0, nit, sigma, seed):\n",
    "  \"\"\"Run the discrete Adam-style recursion with Gaussian gradient noise.\n",
    "\n",
    "  Relies on the notebook globals ``d``, ``beta_1``, ``beta_2`` and ``eps``.\n",
    "\n",
    "  Args:\n",
    "    eta: step size.\n",
    "    x0: starting point, array of length ``d``.\n",
    "    nit: number of stored iterates (``nit - 1`` updates are performed).\n",
    "    sigma: scale of the Gaussian noise added to each gradient.\n",
    "    seed: seed for NumPy's global random generator.\n",
    "\n",
    "  Returns:\n",
    "    Tuple ``(x, f)``: iterates of shape ``(nit, d)`` and losses of shape ``(nit, 1)``.\n",
    "  \"\"\"\n",
    "\n",
    "  # Draw the initialisation noise, then re-seed so the loop restarts the same\n",
    "  # random stream (its first draw repeats this vector).\n",
    "  np.random.seed(seed)\n",
    "  noise = sigma*np.random.normal(size=(d,))\n",
    "  np.random.seed(seed)\n",
    "\n",
    "  x = np.zeros((nit, d))\n",
    "  v = np.zeros((nit, d))\n",
    "  m = np.zeros((nit, d))\n",
    "  f = np.zeros((nit,))\n",
    "  x[0] = x0\n",
    "  f[0] = cost(x[0])\n",
    "  # NOTE(review): the noise perturbs the point here, g(x0 + noise), whereas the\n",
    "  # loop perturbs the gradient, g(x) + noise -- confirm this is intended.\n",
    "  g0 = g(x[0]+noise)\n",
    "  v[0] = g0*g0\n",
    "  m[0] = g0\n",
    "  for k in range(nit-1):\n",
    "\n",
    "    # Bias corrections: both moment estimates have received k+1 updates when\n",
    "    # they are used below, so both share the same exponent.\n",
    "    gamma_1 = 1/(1 - beta_1**(k+1))\n",
    "    gamma_2 = 1/(1 - beta_2**(k+1))\n",
    "\n",
    "    noise = sigma*np.random.normal(size=(d,))\n",
    "    grad = g(x[k])+noise  # noisy gradient, evaluated once per step\n",
    "    m[k+1] = beta_1*m[k]+(1-beta_1)*grad\n",
    "    v[k+1] = beta_2*v[k]+(1-beta_2)*grad*grad\n",
    "    x[k+1] = x[k] - eta*(gamma_1*m[k+1])/(np.sqrt(gamma_2*v[k+1])+eps)\n",
    "    f[k+1] = cost(x[k+1])\n",
    "\n",
    "  return (x, f.reshape(f.shape[-1],1))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "jyuC11NvEIBq"
   },
   "outputs": [],
   "source": [
    "def SDE_Traj(eta, x0, nit, sigma, seed):\n",
    "  \"\"\"Simulate one path of the SDE model plotted as 'SDE (Ours)', discretised with step ``eta``.\n",
    "\n",
    "  Relies on the notebook globals ``d``, ``mu1``, ``mu2`` and ``eps``.\n",
    "\n",
    "  Args:\n",
    "    eta: discretisation step.\n",
    "    x0: starting point, array of length ``d``.\n",
    "    nit: number of stored states (``nit - 1`` updates are performed).\n",
    "    sigma: noise scale; enters the ``v`` update as ``sigma**2`` and scales the\n",
    "      random term of the ``m`` update.\n",
    "    seed: seed for NumPy's global random generator.\n",
    "\n",
    "  Returns:\n",
    "    Tuple ``(x, f)``: states of shape ``(nit, d)`` and losses of shape ``(nit, 1)``.\n",
    "  \"\"\"\n",
    "\n",
    "  # Draw the initialisation noise, then re-seed so the loop restarts the same\n",
    "  # random stream.\n",
    "  np.random.seed(seed)\n",
    "  noise = sigma*np.random.normal(size=(d,))\n",
    "  np.random.seed(seed)\n",
    "\n",
    "  x = np.zeros((nit, d))\n",
    "  v = np.zeros((nit, d))\n",
    "  m = np.zeros((nit, d))\n",
    "  f = np.zeros((nit,))\n",
    "  x[0] = x0\n",
    "  f[0] = cost(x[0])\n",
    "  g0 = g(x[0]+noise)\n",
    "  v[0] = g0*g0\n",
    "  m[0] = g0\n",
    "  for k in range(nit-1):\n",
    "\n",
    "    noise_wm = np.random.normal(size=(d,))\n",
    "\n",
    "    gamma_1 = 1 - np.exp(-mu1*eta*(k+1))\n",
    "    gamma_2 = 1 - np.exp(-mu2*eta*(k+1))\n",
    "\n",
    "    # Noiseless gradient at the current state, shared by the three updates.\n",
    "    grad = g(x[k])\n",
    "\n",
    "    # All three updates read the state at index k only.\n",
    "    x[k+1] = x[k] - eta*(np.sqrt(gamma_2)/gamma_1)*(m[k] + eta*mu1*(grad-m[k]))/(np.sqrt(v[k])  + eps)\n",
    "    v[k+1] = v[k] + mu2*eta*( grad*grad + sigma**2 - v[k]  )\n",
    "    m[k+1] = m[k] + mu1*eta*( grad - m[k]  ) + eta*mu1*sigma*noise_wm\n",
    "\n",
    "    f[k+1] = cost(x[k+1])\n",
    "\n",
    "  return (x,  f.reshape(f.shape[-1],1))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "cxmnxTniFGVt"
   },
   "outputs": [],
   "source": [
    "def SDE_Malladi_Traj(eta, x0, nit, sigma, seed):\n",
    "  \"\"\"Simulate one path of the SDE plotted as 'SDE (Malladi et al.)'.\n",
    "\n",
    "  Relies on the notebook globals ``d``, ``beta_1``, ``beta_2``, ``mu1``, ``mu2``\n",
    "  and ``eps``.\n",
    "\n",
    "  Args:\n",
    "    eta: step size of the discrete algorithm; the scheme advances in steps of ``eta**2``.\n",
    "    x0: starting point, array of length ``d``.\n",
    "    nit: number of stored states (``nit - 1`` updates are performed).\n",
    "    sigma: noise scale; enters the ``u`` update as ``sigma**2`` and scales the\n",
    "      random term of the ``m`` update.\n",
    "    seed: seed for NumPy's global random generator.\n",
    "\n",
    "  Returns:\n",
    "    Tuple ``(x, f)``: states of shape ``(nit, d)`` and losses of shape ``(nit, 1)``.\n",
    "  \"\"\"\n",
    "\n",
    "  # Draw the initialisation noise, then re-seed so the loop restarts the same\n",
    "  # random stream.\n",
    "  np.random.seed(seed)\n",
    "  noise = sigma*np.random.normal(size=(d,))\n",
    "  np.random.seed(seed)\n",
    "\n",
    "  ####### SDE Malladi\n",
    "\n",
    "  sigma0 = eta #other parameters depend on true eta\n",
    "  eps0 = eps*eta\n",
    "  c1 = (1-beta_1)/(eta*eta)\n",
    "  c2 = (1-beta_2)/(eta*eta)\n",
    "\n",
    "  #sde simulation\n",
    "  x = np.zeros((nit, d))\n",
    "  u = np.zeros((nit, d))\n",
    "  m = np.zeros((nit, d))\n",
    "  f = np.zeros((nit,))\n",
    "  x[0] = x0\n",
    "  f[0] = cost(x[0])\n",
    "  g0 = g(x[0]+noise)\n",
    "  u[0] = g0*g0\n",
    "  m[0] = g0\n",
    "  for k in range(nit-1):\n",
    "    noise_wm = np.random.normal(size=(d,))\n",
    "\n",
    "    u[k+1] = u[k] + eta**2 * c2 * (sigma**2- u[k])\n",
    "    m[k+1] = m[k] + eta**2 * c1 * (g(x[k])- m[k]) + sigma0*c1*sigma*noise_wm*np.sqrt(eta**2)\n",
    "\n",
    "    # The preconditioner is diagonal, so divide elementwise instead of building\n",
    "    # and inverting a d-by-d matrix at every step.\n",
    "    precond = sigma0*np.sqrt(u[k])+eps0\n",
    "    gamma_1 = 1 - np.exp(-mu1*eta*(k+1))\n",
    "    gamma_2 = 1 - np.exp(-mu2*eta*(k+1))\n",
    "\n",
    "    # Drift factor sqrt(gamma_2)/gamma_1: first-moment correction in the\n",
    "    # denominator, square root of the second-moment correction in the\n",
    "    # numerator (the same factor SDE_Traj uses).\n",
    "    x[k+1] = x[k] - eta*eta*(np.sqrt(gamma_2)/gamma_1)*m[k]/precond\n",
    "    f[k+1] = cost(x[k+1])\n",
    "  return (x,  f.reshape(f.shape[-1],1))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "ySznf5idOUf8"
   },
   "outputs": [],
   "source": [
    "def _run_trajs(traj_fn, eta, x0, nit, sigma, seeds):\n",
    "  \"\"\"Call ``traj_fn`` once per seed and stack the returned paths and losses.\n",
    "\n",
    "  ``traj_fn`` is called as ``traj_fn(eta, x0, nit+1, sigma, seed)`` and must\n",
    "  return a pair shaped ``(nit+1, d)`` and ``(nit+1, 1)``.\n",
    "\n",
    "  Returns:\n",
    "    Tuple ``(xs, fs)`` of shapes ``(len(seeds), nit+1, d)`` and ``(len(seeds), nit+1, 1)``.\n",
    "  \"\"\"\n",
    "  dim = np.shape(x0)[0]\n",
    "  xs = np.zeros((len(seeds), nit+1, dim))\n",
    "  fs = np.zeros((len(seeds), nit+1, 1))\n",
    "\n",
    "  for i, seed in enumerate(seeds):\n",
    "    print(seed)  # progress trace, one line per seed\n",
    "    xs[i,:,:], fs[i,:,:] = traj_fn(eta, x0, nit+1, sigma, seed)\n",
    "\n",
    "  return (xs, fs)\n",
    "\n",
    "\n",
    "def SDE_Trajs(eta, x0, nit, sigma, seeds):\n",
    "  \"\"\"Run ``SDE_Traj`` for every seed; returns stacked ``(paths, losses)``.\"\"\"\n",
    "  return _run_trajs(SDE_Traj, eta, x0, nit, sigma, seeds)\n",
    "\n",
    "\n",
    "def SDE_Malladi_Trajs(eta, x0, nit, sigma, seeds):\n",
    "  \"\"\"Run ``SDE_Malladi_Traj`` for every seed; returns stacked ``(paths, losses)``.\"\"\"\n",
    "  return _run_trajs(SDE_Malladi_Traj, eta, x0, nit, sigma, seeds)\n",
    "\n",
    "\n",
    "def Algo_Trajs(eta, x0, nit, sigma, seeds):\n",
    "  \"\"\"Run ``Algo_Traj`` for every seed; returns stacked ``(paths, losses)``.\"\"\"\n",
    "  return _run_trajs(Algo_Traj, eta, x0, nit, sigma, seeds)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "K121PaKMDbr6"
   },
   "outputs": [],
   "source": [
    "d = 2\n",
    "H = np.array([[-1.0, 0.0],[0.0, 2.0]])\n",
    "eta = 0.001\n",
    "sigma = 0.1\n",
    "eps = 1e-8\n",
    "\n",
    "landa = 1.0\n",
    "\n",
    "T= 25\n",
    "nit= int(T/eta)\n",
    "nit_alg = nit\n",
    "nit_sde = nit\n",
    "mu1 = 2\n",
    "mu2 = 1\n",
    "\n",
    "beta_1 = 1-eta*mu1\n",
    "beta_2 = 1-eta*mu2\n",
    "\n",
    "np.random.seed(0)\n",
    "\n",
    "x0 = 1*np.random.normal(size=(d,))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "PB0Pzkm0FuKV"
   },
   "outputs": [],
   "source": [
    "seeds = [i for i in np.arange(100)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "DpL6hyoyOp02",
    "outputId": "08f72a4a-1201-437e-f2c0-a4f9a679e5b3",
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "# Simulate the SDE plotted as 'SDE (Ours)' once per seed; the result is a (paths, losses) tuple.\n",
    "SDE_Trajs_ = SDE_Trajs(eta, x0, nit, sigma, seeds)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "RE11kz6oOp3m",
    "outputId": "c858ff0d-3a09-408a-db54-df26f93fcf61",
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "# Simulate the SDE plotted as 'SDE (Malladi et al.)' once per seed; the result is a (paths, losses) tuple.\n",
    "SDE_Malladi_Trajs_ = SDE_Malladi_Trajs(eta, x0, nit, sigma, seeds)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "xERLGH0VOp7C",
    "outputId": "0eed7939-ab3e-454d-9b4f-de4d36bf7f6c",
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "# Run the discrete algorithm plotted as 'Adam' once per seed; the result is a (paths, losses) tuple.\n",
    "Algo_Trajs_ = Algo_Trajs(eta, x0, nit, sigma, seeds)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "tQgz62A-O6s1"
   },
   "outputs": [],
   "source": [
    "# Mean and standard deviation across seeds (axis 0) of the paths [0] and losses [1].\n",
    "avg_SDE_Traj = SDE_Trajs_[0].mean(axis=0)\n",
    "avg_SDE_Loss = SDE_Trajs_[1].mean(axis=0)\n",
    "\n",
    "std_SDE_Traj = SDE_Trajs_[0].std(axis=0)\n",
    "std_SDE_Loss = SDE_Trajs_[1].std(axis=0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "y4Dn3DfgO7Eh"
   },
   "outputs": [],
   "source": [
    "# Mean and standard deviation across seeds (axis 0) of the paths [0] and losses [1].\n",
    "avg_SDE_Malladi_Traj = SDE_Malladi_Trajs_[0].mean(axis=0)\n",
    "avg_SDE_Malladi_Loss = SDE_Malladi_Trajs_[1].mean(axis=0)\n",
    "\n",
    "std_SDE_Malladi_Traj = SDE_Malladi_Trajs_[0].std(axis=0)\n",
    "std_SDE_Malladi_Loss = SDE_Malladi_Trajs_[1].std(axis=0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "y_2nfBUYO7IG"
   },
   "outputs": [],
   "source": [
    "# Mean and standard deviation across seeds (axis 0) of the paths [0] and losses [1].\n",
    "avg_Algo_Traj = Algo_Trajs_[0].mean(axis=0)\n",
    "avg_Algo_Loss = Algo_Trajs_[1].mean(axis=0)\n",
    "\n",
    "std_Algo_Traj = Algo_Trajs_[0].std(axis=0)\n",
    "std_Algo_Loss = Algo_Trajs_[1].std(axis=0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 471
    },
    "id": "GQzbZMZM5vh8",
    "outputId": "7d8ceada-5594-413d-c462-1800bfa276d7"
   },
   "outputs": [],
   "source": [
    "start = 0\n",
    "end = -1\n",
    "\n",
    "# Offset subtracted from every curve so that the Adam curve stays strictly\n",
    "# positive on the log axis. Named loss_floor rather than min so the builtin\n",
    "# min() is not shadowed for the rest of the session.\n",
    "loss_floor = np.min(avg_Algo_Loss) - 1e-4\n",
    "\n",
    "fact = 0.5  # half-width of the shaded band, in standard deviations\n",
    "\n",
    "# Iteration indices of the plotted window; derived from the slice so the lines\n",
    "# and the bands stay aligned for any start/end.\n",
    "steps = np.arange(avg_Algo_Loss.shape[0])[start:end]\n",
    "\n",
    "\n",
    "def _plot_loss_band(avg, std, color, **line_kwargs):\n",
    "  \"\"\"Plot the shifted mean loss with a +/- fact*std band and return the line.\"\"\"\n",
    "  center = (avg[start:end]-loss_floor).flatten()\n",
    "  spread = fact*std[start:end].flatten()\n",
    "  line, = plt.plot(steps, center, color=color, **line_kwargs)\n",
    "  plt.fill_between(steps, center - spread, center + spread, color=color, alpha=0.4)\n",
    "  return line\n",
    "\n",
    "\n",
    "plt.figure()\n",
    "# Drawing order (Malladi et al., Adam, ours) decides which curve ends up on top.\n",
    "line_3 = _plot_loss_band(avg_SDE_Malladi_Loss, std_SDE_Malladi_Loss, colors[1], linewidth=2, dashes=custom_dashes[1])\n",
    "line_1 = _plot_loss_band(avg_Algo_Loss, std_Algo_Loss, colors[4], linewidth=4)\n",
    "line_2 = _plot_loss_band(avg_SDE_Loss, std_SDE_Loss, colors[2], linewidth=2, dashes=custom_dashes[2])\n",
    "\n",
    "plt.legend([line_1, line_2, line_3], ['Adam','SDE (Ours)', 'SDE (Malladi et al.)'],fontsize=14)\n",
    "plt.title(\"Losses\",fontsize=25)\n",
    "plt.xlabel('Iterations',fontsize=25)\n",
    "plt.ylabel('Loss',fontsize=25)\n",
    "plt.xticks(fontsize=16)\n",
    "plt.yticks(fontsize=16)\n",
    "plt.yscale('log')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Axis limits: 10% margin around the largest coordinates of the averaged\n",
    "# Malladi et al. path (the other two paths do not influence the limits).\n",
    "max_x = np.max(np.abs(avg_SDE_Malladi_Traj[:,0]))*1.1\n",
    "max_y = np.max(np.abs(avg_SDE_Malladi_Traj[:,1]))*1.1\n",
    "x_values = np.linspace(-max_x, max_x, 100)\n",
    "y_values = np.linspace(-max_y, max_y, 100)\n",
    "X, Y = np.meshgrid(x_values, y_values)\n",
    "\n",
    "# Evaluate the loss on the grid, one point per call to cost.\n",
    "Z = np.array([[cost(np.array([xv, yv])) for xv, yv in zip(row_x, row_y)]\n",
    "              for row_x, row_y in zip(X, Y)])\n",
    "\n",
    "plt.contourf(X, Y, Z, cmap='coolwarm')  # Adjust the colormap ('cmap') as needed\n",
    "plt.colorbar()  # Add a colorbar to show the values\n",
    "line_1, = plt.plot(avg_Algo_Traj[:,0], avg_Algo_Traj[:,1], color = colors[4],linewidth=4)\n",
    "# Dash pattern per method matches the loss figure: [1] for Malladi et al., [2] for ours.\n",
    "line_3, = plt.plot(avg_SDE_Malladi_Traj[:,0], avg_SDE_Malladi_Traj[:,1], color = colors[1],linewidth=2, dashes=custom_dashes[1])\n",
    "line_2, = plt.plot(avg_SDE_Traj[:,0], avg_SDE_Traj[:,1], color = colors[2],linewidth=3, dashes=custom_dashes[2])\n",
    "\n",
    "\n",
    "plt.xlim([-max_x, max_x])\n",
    "plt.ylim([-max_y, max_y])\n",
    "\n",
    "plt.legend([line_1, line_2, line_3], ['Adam','SDE (Ours)', 'SDE (Malladi et al.)'],fontsize=14)\n",
    "\n",
    "plt.title(\"Trajectories\",fontsize=25)\n",
    "plt.xlabel(r'$X_1$',fontsize=25)\n",
    "plt.ylabel(r'$X_2$',fontsize=25)\n",
    "plt.xticks(fontsize=16)\n",
    "plt.yticks(fontsize=16)\n",
    "plt.show()"
   ]
  }
 ],
 "metadata": {
  "colab": {
   "provenance": []
  },
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 1
}
