{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import cvxpy as cp\n",
    "import numpy as np\n",
    "from sklearn.metrics.pairwise import rbf_kernel\n",
    "from sklearn.metrics import euclidean_distances\n",
    "import matplotlib.pyplot as plt\n",
    "import math\n",
    "from numpy import asarray\n",
    "from numpy import savetxt\n",
    "from numpy import loadtxt\n",
    "\n",
    "import seaborn as sns\n",
    "sns.set_theme(style=\"darkgrid\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# data generation\n",
    "def generate_data(n = 100, dim = 5, B = 1):\n",
    "    # n: number of samples\n",
    "    # dim: dimension\n",
    "    # X ~ Unif[-B, B]^d\n",
    "    x = np.random.uniform(-B, B, size=[n, dim])\n",
    "    return x"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# ERM Solver\n",
    "def cvx_loss(v, th, w):\n",
    "    loss = 0.5 * cp.sum_squares(th - v) + (th - v) @ w\n",
    "    return loss\n",
    "\n",
    "def ERM(x, v):        # return \\hat{\\theta}_n\n",
    "    dim = len(x[0])\n",
    "    n = len(x)\n",
    "    # construct the problem\n",
    "    th = cp.Variable(dim)\n",
    "    objective = cp.Minimize(0.5 * cp.sum_squares(th - v) + cp.sum(x @ (th - v)) /n)\n",
    "    prob = cp.Problem(objective)\n",
    "    result = prob.solve(solver = 'MOSEK')\n",
    "    return th.value"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# K-DRO Solver\n",
    "def matrix_decomp(K):\n",
    "    try:\n",
    "        L = np.linalg.cholesky(K)\n",
    "    except:\n",
    "        # print('warning, K is singular')\n",
    "        d, v = np.linalg.eigh(K)     #L == U*diag(d)*U'. the scipy function forces real eigs\n",
    "        d[np.where(d < 0)] = 0       # get rid of small eigs\n",
    "        L = v @ np.diag(np.sqrt(d))\n",
    "    return L\n",
    "    \n",
    "def medium_heuristic(X, Y):\n",
    "    distsqr = euclidean_distances(X, Y, squared=True)\n",
    "    kernel_width = np.sqrt(0.5 * np.median(distsqr))\n",
    "\n",
    "    # in sklearn,\n",
    "    # kernel is done by K(x, y) = exp(-gamma ||x-y||^2)\n",
    "    kernel_gamma = 1.0 / (2 * kernel_width ** 2)\n",
    "\n",
    "    return kernel_width, kernel_gamma\n",
    " \n",
    "def kDroPy(data_emp, v, eta=0.1, n_certify=0, sampling_method='bound', lb=-1, ub=1, solver='MOSEK'):\n",
    "    '''\n",
    "    data_emp: empirical data samples\n",
    "    eta: eta for dro\n",
    "    dim_th: dimension of decision var\n",
    "    n_certify: num of points to certify the semi inf constr.\n",
    "    lb: the upper bound for the domain\n",
    "    the lower bound\n",
    "    '''\n",
    "    n_sample, dim_th = data_emp.shape         # n_sample: # of samples, dim_th: dim of \\theta\n",
    "    th = cp.Variable(dim_th)                  # variable \\theta\n",
    "    constr = []\n",
    "\n",
    "    # KDRO part\n",
    "    a = cp.Variable(n_sample + n_certify)    # variable \\alpha\n",
    "    f0 = cp.Variable()                       # variable f0\n",
    "    \n",
    "    # --------------------------------------------------------------------------------\n",
    "    # Step 1: generate the sampled support\n",
    "    # --------------------------------------------------------------------------------\n",
    "    if sampling_method=='bound':         # sample within certain bound\n",
    "        # let the samples also live in the intervel I sampled uncertainty w\n",
    "        zeta = np.random.uniform(lb, ub, size=[n_certify, dim_th])\n",
    "    elif sampling_method=='hull':        # sample using convex hull of empirical data\n",
    "        # let the samples also live in the intervel I sampled uncertainty w\n",
    "        # this is equiv. to really do it in multi dimensions, need to sample coeff. from a simplex\n",
    "        zeta = np.random.uniform(np.min(data_emp), np.max(data_emp), size=[n_certify, dim_th])\n",
    "    else:\n",
    "        raise NotImplementedError\n",
    "    \n",
    "    # in practice, we always include the empirical data in the sampled support\n",
    "    zeta = np.concatenate([data_emp, zeta])\n",
    "    \n",
    "    # --------------------------------------------------------------------------------\n",
    "    # Step 2: use medium heuristics for kernel width\n",
    "    # --------------------------------------------------------------------------------\n",
    "    kernel_width, kernel_gamma = medium_heuristic(zeta, zeta)\n",
    "    \n",
    "    # --------------------------------------------------------------------------------\n",
    "    # Step 3: setup objective function and constraints\n",
    "    # --------------------------------------------------------------------------------\n",
    "    # evaluate the f, K at the value of zetas\n",
    "    K = rbf_kernel(zeta, zeta, gamma=kernel_gamma)\n",
    "    f = a @ K\n",
    "    \n",
    "    for i in range((len(zeta))):\n",
    "        constr += [cvx_loss(v, th, zeta[i]) <= f0 + f[i]]\n",
    "\n",
    "    obj = f0 + cp.sum(f[0:n_sample]) / n_sample + eta * cp.norm(a.T @ matrix_decomp(K))\n",
    "    opt = cp.Problem(cp.Minimize(obj), constr)\n",
    "   \n",
    "    if solver is None:\n",
    "        opt.solve()\n",
    "    else:\n",
    "        opt.solve(solver=solver)\n",
    "    return th.value #, obj.value, a.value, f0.value, kernel_gamma, zeta"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Loss Function\n",
    "def exp_loss(th, v):\n",
    "    loss = 0.5 * np.sum(np.square(np.subtract(th , v))) \n",
    "    return loss"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def erm_loss(dim, n, v, B, rep):\n",
    "    loss_list = np.zeros(rep)\n",
    "    for i in range(rep):\n",
    "        x = generate_data(n, dim, B)\n",
    "        loss_list[i] = exp_loss(ERM(x, v), v)\n",
    "    mean = np.mean(loss_list)\n",
    "    return mean"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def dro_loss(dim, n, v, B, m, eta, rep):\n",
    "    loss_list = np.zeros(rep)\n",
    "    for i in range(rep):\n",
    "        x = generate_data(n = n, dim = dim, B = 1)\n",
    "        loss_list[i] = exp_loss(kDroPy(x, v, eta=eta, n_certify=m, sampling_method='bound', lb=-1, ub=1, solver='MOSEK'), v)\n",
    "    mean = np.mean(loss_list)\n",
    "    return mean"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Numerical Result\n",
    "- parameters:\n",
    "    - n: number of samples\n",
    "    - m: number of support samples\n",
    "    - d: dimension of x\n",
    "    - rep: number of repitition\n",
    "    - epsilon: ball level\n",
    "- experiments\n",
    "    - fix $d$, $\\epsilon$, varying $n$, $m$ ($m = 10 n$)\n",
    "    - fix $n$, $m$,$d$, varying $\\epsilon$"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "rep = 500\n",
    "dim = 5\n",
    "B_list = [1, 10, 100]\n",
    "#v = np.random.uniform(0.5, 1, size=dim)\n",
    "n_list = [25, 50, 75, 100, 125, 150, 175, 200]\n",
    "m_list = n_list\n",
    "eta_list = [0.01, 0.05, 0.1, 0.15, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1]\n",
    "\n",
    "# save to csv file\n",
    "#savetxt('v.csv', asarray(v), delimiter=',')\n",
    "v = loadtxt('v.csv', delimiter=',')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "erm_mean = np.ones([len(B_list), len(n_list)])\n",
    "for i in range(len(B_list)):\n",
    "    for j in range(len(n_list)):\n",
    "        erm_mean[i][j] = erm_loss(dim, n_list[j], v, B_list[i], 500)\n",
    "        print('B = ' + str(B_list[i]) + ', n = ' + str(n_list[j]) +', average loss = ' + str(erm_mean[i][j]))\n",
    "\n",
    "erm_loss_list1 = asarray(erm_mean[0])\n",
    "erm_loss_list10 = asarray(erm_mean[1])\n",
    "erm_loss_list100 = asarray(erm_mean[2])\n",
    "# save to csv file\n",
    "savetxt('erm_loss_list1.csv', erm_loss_list1, delimiter=',')\n",
    "savetxt('erm_loss_list10.csv', erm_loss_list10, delimiter=',')\n",
    "savetxt('erm_loss_list100.csv', erm_loss_list100, delimiter=',')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%%time\n",
    "dro_mean = np.zeros([len(B_list), len(n_list), len(eta_list)])\n",
    "for k in range(len(B_list)):\n",
    "    for i in range(len(n_list)):\n",
    "        print( 'B = ' + str(B_list[k]) + ', n = ' + str(n_list[i]) + ' started' )\n",
    "        for j in range(len(eta_list)):\n",
    "            dro_mean[k][i][j] = dro_loss(dim, n_list[i], v, B_list[k], m_list[i], eta_list[j], rep)\n",
    "\n",
    "dro_loss_list1 = asarray(dro_mean[0])\n",
    "dro_loss_list10 = asarray(dro_mean[1])\n",
    "dro_loss_list100 = asarray(dro_mean[2])\n",
    "# save to csv file\n",
    "savetxt('dro_loss_list1.csv', dro_loss_list1, delimiter=',')\n",
    "savetxt('dro_loss_list10.csv', dro_loss_list10, delimiter=',')\n",
    "savetxt('dro_loss_list100.csv', dro_loss_list100, delimiter=',')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "min_dro_mean = np.zeros([len(B_list), len(n_list)])\n",
    "index_list = np.zeros([len(B_list), len(n_list)])\n",
    "for k in range(len(B_list)):\n",
    "    for i in range(len(n_list)):\n",
    "        min_dro_mean[k][i] = np.min(dro_mean[k][i])\n",
    "        index_list[k][i] = np.argmin(dro_mean[k][i])\n",
    "\n",
    "\n",
    "for k in range(len(B_list)):\n",
    "    print('B = '+ str(B_list[k]) + ': ' + str([eta_list[int(index_list[k][i])] for i in range(len(n_list))]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%%time\n",
    "\n",
    "plt.figure()\n",
    "plt.plot(n_list, erm_mean[0], 'b--', label = \"ERM, B=1\", marker = \"s\")\n",
    "plt.plot(n_list, erm_mean[1], 'g--', label = \"ERM, B=10\", marker = \"^\")\n",
    "plt.plot(n_list, erm_mean[2], 'r--', label = \"ERM, B=100\", marker = \"x\")\n",
    "plt.plot(n_list, min_dro_mean[0] , color = 'b', label = \"DRO, B=1\", marker = \"s\")\n",
    "plt.plot(n_list, min_dro_mean[1] , color = 'g', label = \"DRO, B=10\", marker = \"^\")\n",
    "plt.plot(n_list, min_dro_mean[2] , color = 'r', label = \"DRO, B=100\", marker = \"x\")\n",
    "\n",
    "plt.yscale('log')\n",
    "plt.legend(loc = \"best\")\n",
    "#plt.legend(loc = \"upper left\", bbox_to_anchor=(1.05, 1))\n",
    "\n",
    "plt.xlabel('sample size n')\n",
    "plt.ylabel('excess risk')\n",
    "\n",
    "plt.xticks(n_list, n_list)\n",
    "\n",
    "plt.savefig('regression_n.eps', format='eps', bbox_inches = 'tight')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%%time\n",
    "\n",
    "plt.figure()\n",
    "\n",
    "plt.plot(eta_list, erm_mean[0][1] * np.ones(len(eta_list)), 'b--', label = \"ERM, B=1, n=50\")\n",
    "plt.plot(eta_list, erm_mean[0][3] * np.ones(len(eta_list)), 'g', label = \"ERM, B=1, n=100\")\n",
    "plt.plot(eta_list, erm_mean[0][7] * np.ones(len(eta_list)), 'r:', label = \"ERM, B=1, n=200\")\n",
    "\n",
    "plt.plot(eta_list, dro_mean[0][1] , color = 'b', label = \"DRO, B=1, n=50\", marker = \"s\")\n",
    "plt.plot(eta_list, dro_mean[0][3] , color = 'g', label = \"DRO, B=1, n=100\", marker = \"^\")\n",
    "plt.plot(eta_list, dro_mean[0][7] , color = 'r', label = \"DRO, B=1, n=200\", marker = \"x\")\n",
    "\n",
    "\n",
    "\n",
    "plt.yscale('log')\n",
    "plt.legend(loc = \"best\")\n",
    "\n",
    "plt.xlabel(r\"$\\eta$\")\n",
    "plt.ylabel('excess risk')\n",
    "plt.legend(loc = \"best\")\n",
    "#plt.legend(loc = \"upper left\", bbox_to_anchor=(1.05, 1))\n",
    "\n",
    "x_ticks = [0.01, 0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1]\n",
    "\n",
    "plt.xticks(x_ticks, x_ticks)\n",
    "\n",
    "plt.savefig('regression_eta.eps', format='eps', bbox_inches = 'tight')"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
