{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from sklearn.metrics import mean_squared_error\n",
    "from function import Kernel_sobo, choose_lam_r_quantile\n",
    "import numpy as np\n",
    "import scipy.stats as stats\n",
    "import tqdm\n",
    "# plot image of mse for fixed r and varing sample size\n",
    "import matplotlib.pyplot as plt\n",
    "np.random.seed(10)\n",
    "\n",
    "\n",
    "def scale_kernel(alpha, x, y):\n",
    "    \"\"\"define the spike kernel\"\"\"\n",
    "    return 2*sum(np.cos(2*np.pi*k*(x-y))/((k+1)**alpha) for k in range(100))+1\n",
    "\n",
    "\n",
    "#specify kernel function\n",
    "def kernel_spike(alpha, x, y):\n",
    "    \"\"\"define the spike kernel\"\"\"\n",
    "    n = x.shape[0]\n",
    "    m = y.shape[0]\n",
    "    K = np.zeros([n,m])\n",
    "    for i in range(n):\n",
    "        for j in range(m):\n",
    "            K[i,j] = scale_kernel(alpha, x[i], y[j])\n",
    "    return K\n",
    "\n",
    "\n",
    "# underlying mean regression function\n",
    "def f_0(x):\n",
    "    \"\"\"define the mean regression function for 1-dimensional KRR (Example S1 in supplementary material)\"\"\"\n",
    "    return scale_kernel(3.5,x,0)*np.sin(1*x)\n",
    "\n",
    "sd = 2\n",
    "tau = 0.5\n",
    "f_true = f_0\n",
    "\n",
    "def generate_data(n, f):\n",
    "    \"\"\"generate data from the mean regression function f (f_0 or f_1)\"\"\"\n",
    "    x_train=np.sort(np.random.rand(n))\n",
    "    y_train=f(x_train)+np.random.normal(0, sd, n) - stats.norm.ppf(tau, loc=0, scale=sd)\n",
    "    return x_train,y_train\n",
    "\n",
    "\n",
    "\n",
    "alpha_list = [2, 4, 6, 8, 10]\n",
    "n = 300\n",
    "iter_num = 50\n",
    "mse_list = np.zeros([iter_num, len(alpha_list), 2])\n",
    "mse_mean = np.zeros([len(alpha_list), 2])\n",
    "mse_var = np.zeros([len(alpha_list), 2])\n",
    "\n",
    "for i in range(len(alpha_list)):\n",
    "    alpha = alpha_list[i]\n",
    "    for j in tqdm.tqdm(range(iter_num)):\n",
    "        x_train, y_train = generate_data(n,  f_true)\n",
    "        y_true = f_true(x_train)\n",
    "        K = kernel_spike(alpha, x_train, x_train)\n",
    "        mse_list[j, i, 0] = choose_lam_r_quantile(K, y_train, y_true, truncation=True, tau=tau, loss_type=\"excess_risk\")\n",
    "        mse_list[j, i, 1] = choose_lam_r_quantile(K, y_train, y_true, truncation=False, tau=tau, loss_type=\"excess_risk\")\n",
    "    mse_mean[i, 0] = np.mean(mse_list[:, i, 0])\n",
    "    mse_var[i, 0] = np.std(mse_list[:, i, 0])\n",
    "    mse_mean[i, 1] = np.mean(mse_list[:, i, 1])\n",
    "    mse_var[i, 1] = np.std(mse_list[:, i, 1])\n",
    "    print(\"alpha=\", alpha_list[i], \",truncated mean mse=\", format(mse_mean[i, 0], '.3f'),  \",full mean mse=\", format(mse_mean[i, 1], '.3f'))\n",
    "    print(\"alpha=\", alpha_list[i], \",truncated std mse=\", format(mse_var[i, 0], '.3f'),  \",full var mse=\", format(mse_var[i, 1], '.3f'))\n",
    "print(\"hyperparameters is\", \"n =\", n,  \"alpha_list = \", alpha_list, \"iter_num = \", iter_num, \"tau = \", tau, \"sd = \", sd)\n",
    "plt.plot(alpha_list, mse_mean[:, 0], label=\"truncated mean\")\n",
    "plt.plot(alpha_list, mse_mean[:, 1], label=\"full\")\n",
    "plt.fill_between(alpha_list, mse_mean[:, 0]-mse_var[:, 0], mse_mean[:, 0]+mse_var[:, 0], alpha=0.2)\n",
    "plt.fill_between(alpha_list, mse_mean[:, 1]-mse_var[:, 1], mse_mean[:, 1]+mse_var[:, 1], alpha=0.2)\n",
    "plt.legend()\n",
    "plt.xlabel('alpha')\n",
    "plt.ylabel('excess risk')\n",
    "plt.title('KQR, tau=0.5')\n",
    "plt.show()\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "d2l",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
