{
  "nbformat": 4,
  "nbformat_minor": 0,
  "metadata": {
    "colab": {
      "provenance": [],
      "gpuType": "V28"
    },
    "kernelspec": {
      "name": "python3",
      "display_name": "Python 3"
    },
    "language_info": {
      "name": "python"
    },
    "accelerator": "TPU"
  },
  "cells": [
    {
      "cell_type": "code",
      "source": [
        "import pandas as pd\n",
        "import numpy as np\n",
        "import matplotlib.pyplot as plt\n",
        "import gpytorch\n",
        "import torch\n",
        "import plotly.graph_objects as go\n",
        "from scipy.stats import norm\n"
      ],
      "metadata": {
        "id": "epGv2RmIoWsc"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "base_path = \"/content/drive/MyDrive/Experiments/CA_Housing/\"\n",
        "\n",
        "X_train = pd.read_csv(base_path + \"x_train_CAhousing.csv\", header=None, sep='\\s+').values.astype(np.float32)\n",
        "y_train = pd.read_csv(base_path + \"y_train_CAhousing.csv\", header=None, sep='\\s+').values.astype(np.float32).flatten()\n",
        "X_test  = pd.read_csv(base_path + \"x_test_CAhousing.csv\", header=None, sep='\\s+').values.astype(np.float32)\n",
        "y_test  = pd.read_csv(base_path + \"y_test_CAhousing.csv\", header=None, sep='\\s+').values.astype(np.float32).flatten()\n",
        "\n",
        "device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')\n",
        "# Ensure inputs are of shape (n_samples, num_features)\n",
        "X_train_tensor = torch.from_numpy(X_train).to(device)\n",
        "y_train_tensor = torch.from_numpy(y_train).to(device)\n",
        "X_test_tensor  = torch.from_numpy(X_test).to(device)\n",
        "y_test_tensor  = torch.from_numpy(y_test).to(device)"
      ],
      "metadata": {
        "id": "CswKpD41oWky"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "grid_bounds = []\n",
        "for i in range(X_train.shape[1]):\n",
        "    mn = X_train[:, i].min().item()\n",
        "    mx = X_train[:, i].max().item()\n",
        "    grid_bounds.append((mn, mx))\n"
      ],
      "metadata": {
        "id": "jgUTpXagobsg"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "# Define the GP regression model using SKI with additive structure.\n",
        "class GPRegressionModel(gpytorch.models.ExactGP):\n",
        "    def __init__(self, train_x, train_y, likelihood):\n",
        "        super(GPRegressionModel, self).__init__(train_x, train_y, likelihood)\n",
        "        self.mean_module = gpytorch.means.ConstantMean()\n",
        "        base_kernel = gpytorch.kernels.RBFKernel()\n",
        "        # Use a fixed grid size for each 1D kernel. Here we choose 128 inducing points per dimension.\n",
        "        # We set kronecker_structure=False so that the grid is computed independently per dimension.\n",
        "        grid_size = 30\n",
        "        # The base kernel (wrapped in GridInterpolationKernel) acts on one dimension:\n",
        "        base_kernel_interp = gpytorch.kernels.GridInterpolationKernel(\n",
        "            base_kernel, grid_size=grid_size, num_dims=1\n",
        "        )\n",
        "        # The AdditiveStructureKernel wraps the base kernel so that it acts independently\n",
        "        # on each feature and then sums the resulting 1D covariance matrices.\n",
        "        # Set num_dims equal to the number of features in the input.\n",
        "        num_features = train_x.size(-1)\n",
        "        self.covar_module = gpytorch.kernels.AdditiveStructureKernel(\n",
        "            gpytorch.kernels.ScaleKernel(base_kernel_interp),\n",
        "            num_dims=num_features\n",
        "        )\n",
        "\n",
        "    def forward(self, x):\n",
        "        mean_x = self.mean_module(x)\n",
        "        covar_x = self.covar_module(x)\n",
        "        return gpytorch.distributions.MultivariateNormal(mean_x, covar_x)"
      ],
      "metadata": {
        "id": "l4Jx5wuboe3w"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "# Create likelihood and model using the full dataset\n",
        "likelihood = gpytorch.likelihoods.GaussianLikelihood().to(device)\n",
        "model = GPRegressionModel(X_train_tensor, y_train_tensor, likelihood).to(device)\n",
        "\n",
        "model.train()\n",
        "likelihood.train()\n",
        "\n",
        "optimizer = torch.optim.Adam(model.parameters(), lr=0.1)\n",
        "mll = gpytorch.mlls.ExactMarginalLogLikelihood(likelihood, model)\n",
        "\n",
        "def train_ski(num_epochs=100):\n",
        "    for i in range(num_epochs):\n",
        "        optimizer.zero_grad()\n",
        "        # Use the same training inputs as at model creation.\n",
        "        output = model(X_train_tensor)\n",
        "        loss = -mll(output, y_train_tensor)\n",
        "        loss.backward()\n",
        "        optimizer.step()\n",
        "        print(f'Epoch {i + 1}/{num_epochs} - Loss: {loss.item():.3f}')\n",
        "\n",
        "def predict(x_new):\n",
        "    model.eval()\n",
        "    likelihood.eval()\n",
        "    with torch.no_grad(), gpytorch.settings.fast_pred_var():\n",
        "        pred_dist = likelihood(model(x_new))\n",
        "        mean = pred_dist.mean\n",
        "        std = pred_dist.stddev\n",
        "    return mean, std\n"
      ],
      "metadata": {
        "id": "ZnQaHeh8ohOp"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "train_ski(num_epochs=25)"
      ],
      "metadata": {
        "id": "gwDWu18MonRZ"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "checkpoint_path = base_path + \"ski_checkpoint.pth\"\n",
        "torch.save({\n",
        "    'model_state_dict': model.state_dict(),\n",
        "    'likelihood_state_dict': likelihood.state_dict(),\n",
        "    'optimizer_state_dict': optimizer.state_dict()\n",
        "}, checkpoint_path)\n"
      ],
      "metadata": {
        "id": "NWhTBVd7XDBx"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "pred_mean_ski, pred_std_ski = predict(X_test_tensor)"
      ],
      "metadata": {
        "id": "GO1gMUnWvPAp"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "def crps_gaussian(y, mu, sigma):\n",
        "    z = (y - mu) / sigma\n",
        "    crps = sigma * (z * (2 * norm.cdf(z) - 1) + 2 * norm.pdf(z) - 1 / np.sqrt(np.pi))\n",
        "    return crps\n",
        "\n",
        "rmse = np.sqrt(np.mean((pred_mean_ski.cpu().numpy() - y_test)**2))\n",
        "print(f\"RMSE: {rmse}\")\n",
        "\n",
        "crps_values = crps_gaussian(y_test, pred_mean_ski.cpu().numpy(), pred_std_ski.cpu().numpy())\n",
        "mean_crps = np.mean(crps_values)\n",
        "print(f\"Mean CRPS: {mean_crps}\")"
      ],
      "metadata": {
        "id": "zVK-e6oKyGhk"
      },
      "execution_count": null,
      "outputs": []
    }
  ]
}