{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "af1e0909-65dd-4c1f-8f13-e6b5aed09fc9",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "from gpcam import GPOptimizer\n",
    "import matplotlib.pyplot as plt\n",
    "import random\n",
    "import torch"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "1a6020cc",
   "metadata": {},
   "outputs": [],
   "source": [
    "#Create data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b1585408",
   "metadata": {},
   "outputs": [],
   "source": [
    "from itertools import product\n",
    "x_pred1D = np.linspace(0,1,1000).reshape(-1,1)\n",
    "def f1(x):\n",
    "    return np.sin(5. * x) + np.cos(20. * x) + (2.* (x-0.4)**2) * np.cos(400. * x)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "aeef5f69-32ab-4be1-81cb-d41123dd9f54",
   "metadata": {},
   "outputs": [],
   "source": [
    "x_train_1d = np.genfromtxt(\"data/x_train_1d.csv\").reshape(-1,1)\n",
    "y_train_1d = np.genfromtxt(\"data/y_train_1d.csv\")\n",
    "\n",
    "\n",
    "x_test_1d = np.genfromtxt(\"data/x_test_1d.csv\").reshape(-1,1)\n",
    "y_test_1d = np.genfromtxt(\"data/y_test_1d.csv\")"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "6ebc3785-2ce5-4966-a61a-ad7d79f22d92",
   "metadata": {},
   "source": [
    "### 1d - gp2Scale"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "eaf94b49",
   "metadata": {},
   "outputs": [],
   "source": [
    "import dask\n",
    "from dask.distributed import Client\n",
    "import os\n",
    "import time\n",
    "\n",
    "scheduler_file = os.path.join(os.environ[\"SCRATCH\"], \"scheduler_file1d.json\")\n",
    "\n",
    "dask.config.config[\"distributed\"][\"dashboard\"][\"link\"] = \"{JUPYTERHUB_SERVICE_PREFIX}proxy/{host}:{port}/status\" \n",
    "\n",
    "while True:\n",
    "    time.sleep(2)\n",
    "    if os.path.isfile(scheduler_file):\n",
    "        print(\"file found\")\n",
    "        time.sleep(5)\n",
    "        client = Client(scheduler_file=scheduler_file)\n",
    "        break\n",
    "print(\"waiting for workers\")\n",
    "client.wait_for_workers(8)\n",
    "print(client)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "dfe452b7-84b9-46ed-8e92-97ad7723f52f",
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "hps_bounds = np.array([\n",
    "                      [0.1, 4.],\n",
    "                      [0.1, 4.],\n",
    "                      [0.1, 4.],\n",
    "                      [0.001, 0.5],\n",
    "                      [0.001, 0.5],\n",
    "                      [0.001, 0.5]])  ##length scale for Wendland kernel\n",
    "\n",
    "init_hps = np.random.uniform(size = len(hps_bounds), low = hps_bounds[:,0], high = hps_bounds[:,1])\n",
    "\n",
    "\n",
    "def sig(x, hps): \n",
    "    hps2 = 0.1\n",
    "    return ((hps[0] * np.exp(-(x**2)/hps2)) + \n",
    "            (hps[1] * np.exp(-((x-0.5)**2)/hps2)) + \n",
    "            (hps[2] * np.exp(-((x-1.0)**2)/hps2)))\n",
    "\n",
    "def rad(x, hps): \n",
    "    hps2 = 0.1\n",
    "    return ((hps[3] * np.exp(-(x**2)/hps2)) + \n",
    "            (hps[4] * np.exp(-(x-0.5)**2/hps2)) + \n",
    "            (hps[5] * np.exp(-(x-1.0)**2/hps2)))\n",
    "\n",
    "\n",
    "from gpcam.gp_kernels import *\n",
    "def gibbs_wendland(x1,x2,hps):\n",
    "    d = get_distance_matrix(x1,x2)\n",
    "    radius1 = rad(x1, hps)\n",
    "    radius2 = rad(x2, hps)\n",
    "    s1 = sig(x1, hps)\n",
    "    s2 = sig(x2, hps)\n",
    "    \n",
    "    r = np.add.outer(radius1**2, radius2**2).reshape(len(x1),len(x2))\n",
    "    A = np.sqrt(2. * np.outer(radius1, radius2)/ r)\n",
    "    \n",
    "    a = np.sqrt(d**2/r)\n",
    "    a[a>1.] = 1.\n",
    "    kernel = A * (1.-a)**8 * (35.*a**3 + 25.*a**2 + 8.*a + 1.)\n",
    "    return np.outer(s1,s2) * kernel\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "75dd1752",
   "metadata": {},
   "outputs": [],
   "source": [
    "my_gp2S = GPOptimizer(x_train_1d,y_train_1d,init_hyperparameters=init_hps, \n",
    "            gp2Scale = True, gp2Scale_batch_size= 500, gp2Scale_dask_client = client,\n",
    "                      gp_kernel_function=gibbs_wendland, noise_variances=np.zeros(y_train_1d.shape) + 0.01)\n",
    "\n",
    "my_gp2S.train(hyperparameter_bounds=hps_bounds, max_iter = 10000, info = True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4aeeb632-0b96-419d-a9fd-fbd1716e5b9d",
   "metadata": {},
   "outputs": [],
   "source": [
    "rmse = my_gp2S.rmse(x_test_1d, y_test_1d)\n",
    "print(rmse)\n",
    "\n",
    "crps = my_gp2S.crps(x_test_1d, y_test_1d)\n",
    "print(crps)\n",
    "\n",
    "\n",
    "mean_pred = my_gp2S.posterior_mean(x_test_1d)[\"f(x)\"]\n",
    "cov_pred = my_gp2S.posterior_covariance(x_test_1d)[\"v(x)\"]\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "160c872a-2167-4c81-a4c4-770727a798bf",
   "metadata": {},
   "outputs": [],
   "source": [
    "plt.figure(figsize = (15,5))\n",
    "plt.xticks([0.,0.5,1.0])\n",
    "plt.yticks([-2,-1,0.,1])\n",
    "plt.xticks(fontsize=20)\n",
    "plt.yticks(fontsize=20)\n",
    "plt.plot(x_pred1D,f1(x_pred1D), color = 'orange', linewidth = 2, label=\"f(x)\")\n",
    "plt.scatter(x_train_1d[:,0],y_train_1d, color = 'grey', s=2., label = \"data\")\n",
    "plt.scatter(x_test_1d, mean_pred, label = \"predictions\")\n",
    "plt.legend()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e6003605-4e56-4323-8455-34a1496250c0",
   "metadata": {},
   "outputs": [],
   "source": [
    "plt.plot(x_pred1D, sig(x_pred1D,my_gp2S.get_hyperparameters()))\n",
    "plt.show()\n",
    "plt.plot(x_pred1D, rad(x_pred1D,my_gp2S.get_hyperparameters()))\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6beb1386",
   "metadata": {},
   "outputs": [],
   "source": [
    "res = np.hstack([x_test_1d.reshape(-1,1), mean_pred.reshape(-1,1), cov_pred.reshape(-1,1)])\n",
    "np.savetxt(\"gp2ScaleResult1D.csv\", res)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "763b2fa6-2d4e-4d50-b560-2b9e2a0af682",
   "metadata": {},
   "source": [
    "## Base GP"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "fa0e17c0-fb1d-4936-9129-c55e3689e464",
   "metadata": {},
   "outputs": [],
   "source": [
    "hps_bounds = np.array([[0.01,4.],      ##signal var of Wendland kernel\n",
    "                       [0.001,1.05]])  ##length scale for Wendland kernel\n",
    "\n",
    "\n",
    "from gpcam.gp_kernels import *\n",
    "def kernel(x1,x2, hps):\n",
    "    d = get_distance_matrix(x1,x2)\n",
    "    return hps[0] * squared_exponential_kernel(d,hps[1])\n",
    "\n",
    "init_hps = np.random.uniform(size = len(hps_bounds), low = hps_bounds[:,0], high = hps_bounds[:,1])\n",
    "my_gp2S = GPOptimizer(x_train_1d, y_train_1d, init_hyperparameters=init_hps, gp_kernel_function=kernel,\n",
    "                      noise_variances=np.zeros(y_train_1d.shape) + 0.01)\n",
    "\n",
    "my_gp2S.train(hyperparameter_bounds=hps_bounds, max_iter = 500, method = \"mcmc\", info = True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "de214939-c84f-42dd-bf8f-2cb76c73e026",
   "metadata": {},
   "outputs": [],
   "source": [
    "mean_pred = my_gp2S.posterior_mean(x_test_1d)[\"f(x)\"]\n",
    "#print(mean_pred)\n",
    "cov_pred = my_gp2S.posterior_covariance(x_test_1d)[\"v(x)\"]\n",
    "#print(mean_pred)\n",
    "\n",
    "\n",
    "print(my_gp2S.rmse(x_test_1d,y_test_1d))\n",
    "print(my_gp2S.crps(x_test_1d,y_test_1d))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "32ef3e63-aa86-4134-b7ec-48ec6a44f26a",
   "metadata": {},
   "outputs": [],
   "source": [
    "res = np.hstack([x_test_1d.reshape(-1,1), mean_pred.reshape(-1,1), cov_pred.reshape(-1,1)])\n",
    "\n",
    "\n",
    "np.savetxt(\"BaseGPResult1D.csv\", res)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "1denv",
   "language": "python",
   "name": "1denv"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
