{
  "cells": [
    {
      "cell_type": "markdown",
      "id": "f2a722d1",
      "metadata": {
        "id": "f2a722d1"
      },
      "source": [
        "# Libraries"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "e605f985",
      "metadata": {
        "id": "e605f985"
      },
      "outputs": [],
      "source": [
        "import numpy as np\n",
        "import matplotlib.pyplot as plt\n",
        "from scipy.integrate import odeint\n",
        "from sklearn.linear_model import Ridge\n",
        "from matplotlib.colors import Normalize\n",
        "import networkx as nx\n",
        "from scipy.signal import welch\n",
        "import matplotlib.cm as cm\n",
        "import seaborn as sns\n",
        "from collections import defaultdict\n",
        "from sklearn.decomposition import PCA\n",
        "from sklearn.preprocessing import MinMaxScaler\n",
        "import torch\n",
        "import torch.nn as nn\n",
        "from torch.optim import Adam\n",
        "from itertools import combinations_with_replacement"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "cba69c65",
      "metadata": {
        "id": "cba69c65"
      },
      "source": [
        "# Utils"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "4984ec68",
      "metadata": {
        "id": "4984ec68"
      },
      "outputs": [],
      "source": [
        "def scale_spectral_radius(W, target_radius=0.95):\n",
        "    \"\"\"\n",
        "    Scales a matrix W so that its largest eigenvalue magnitude = target_radius.\n",
        "    \"\"\"\n",
        "    eigvals = np.linalg.eigvals(W)\n",
        "    radius = np.max(np.abs(eigvals))\n",
        "    if radius == 0:\n",
        "        return W\n",
        "    return (W / radius) * target_radius"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "c3ecdba6",
      "metadata": {
        "id": "c3ecdba6"
      },
      "outputs": [],
      "source": [
        "def augment_state_with_squares(x):\n",
        "    \"\"\"\n",
        "    Given state vector x in R^N, return [ x, x^2, 1 ] in R^(2N+1).\n",
        "    We'll use this for both training and prediction.\n",
        "    \"\"\"\n",
        "    x_sq = x**2\n",
        "    return np.concatenate([x, x_sq, [1.0]])  # shape: 2N+1"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "97207c33",
      "metadata": {
        "id": "97207c33"
      },
      "outputs": [],
      "source": [
        "def plot_pca_projection3d(states):\n",
        "    # Apply PCA for 3D visualization\n",
        "    pca = PCA(n_components=3)\n",
        "    proj = pca.fit_transform(states)\n",
        "\n",
        "    sns.set_theme(style=\"white\")\n",
        "    fig = plt.figure(figsize=(12, 9))  \n",
        "    ax = plt.axes(projection='3d')\n",
        "\n",
        "    # Scatter plot\n",
        "    p = ax.scatter(proj[:, 0], proj[:, 1], proj[:, 2],\n",
        "                   c=np.arange(len(proj)), cmap='viridis', s=2.5)\n",
        "\n",
        "    # Axis labels with padding\n",
        "    ax.set_xlabel(\"PC1\")\n",
        "    ax.set_ylabel(\"PC2\")\n",
        "    ax.set_zlabel(\"PC3\")\n",
        "\n",
        "    cbar = fig.colorbar(p, ax=ax, shrink=0.6, pad=0.1)\n",
        "    cbar.set_label(\"Index progression\")\n",
        "\n",
        "    plt.savefig('Figures/PCA_projection_2d_rossler_trigr.png', dpi=400)\n",
        "    plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "399a9166",
      "metadata": {
        "id": "399a9166"
      },
      "outputs": [],
      "source": [
        "def plot_pca_projection2d(states):\n",
        "    # Apply PCA for 3D visualization\n",
        "    pca = PCA(n_components=2)\n",
        "    proj = pca.fit_transform(states)\n",
        "\n",
        "    sns.set_theme(style=\"white\")\n",
        "    fig = plt.figure(figsize=(10, 7))\n",
        "    ax = fig.add_subplot(111)\n",
        "    p = ax.scatter(proj[:, 0], proj[:, 1], c=np.arange(len(proj)), cmap='plasma', s=2.5)\n",
        "\n",
        "    ax.set_xlabel(\"PC1\")\n",
        "    ax.set_ylabel(\"PC2\")\n",
        "    plt.savefig('Figures/PCA_projection_3d_rossler_trigr.png', dpi=400)\n",
        "    plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "69cfe8ac",
      "metadata": {
        "id": "69cfe8ac"
      },
      "outputs": [],
      "source": [
        "import matplotlib.colors as colors\n",
        "import matplotlib.gridspec as gridspec\n",
        "\n",
        "def visualize_sparsity(matrix1, matrix2):\n",
        "        combined = np.stack([matrix1, matrix2])\n",
        "        min_nonzero = np.min(combined[combined > 0])\n",
        "        small_value = min_nonzero / 1000\n",
        "        vmax = np.max(combined)\n",
        "        norm = colors.LogNorm(vmin=small_value, vmax=vmax)\n",
        "\n",
        "        # Setup figure and gridspec\n",
        "        fig = plt.figure(figsize=(20, 8))\n",
        "        gs = gridspec.GridSpec(1, 3, width_ratios=[1, 1, 0.05], wspace=0.05)\n",
        "\n",
        "        ax1 = plt.subplot(gs[0])\n",
        "        ax2 = plt.subplot(gs[1])\n",
        "        cbar_ax = plt.subplot(gs[2])  \n",
        "\n",
        "        # Plot first matrix\n",
        "        sns.heatmap(matrix1, cmap='twilight', ax=ax1, norm=norm, mask=(matrix1 == 0), cbar=False)\n",
        "        ax1.axis('off')\n",
        "\n",
        "        # Plot second matrix\n",
        "        sns.heatmap(matrix2, cmap='twilight', ax=ax2, norm=norm, mask=(matrix2 == 0),\n",
        "                        cbar=True, cbar_ax=cbar_ax)\n",
        "        ax2.axis('off')\n",
        "        plt.savefig('Figures/Sparsity Visualization.png', dpi=400)\n",
        "        plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "e9023f48",
      "metadata": {
        "id": "e9023f48"
      },
      "outputs": [],
      "source": [
        "def create_delay_embedding(signal, embed_dim):\n",
        "    L = len(signal) - embed_dim + 1\n",
        "    emb = np.zeros((L, embed_dim))\n",
        "    for i in range(L):\n",
        "        emb[i, :] = signal[i:i+embed_dim]\n",
        "    return emb"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "c6ac8933",
      "metadata": {
        "id": "c6ac8933"
      },
      "source": [
        "# Baselines"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "8a500e05",
      "metadata": {
        "id": "8a500e05"
      },
      "source": [
        "### Baseline ESN"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "b84b674e",
      "metadata": {
        "id": "b84b674e"
      },
      "outputs": [],
      "source": [
        "class ESN3D:\n",
        "    \"\"\"\n",
        "    Sparse random ESN for 3D->3D single-step,\n",
        "    teacher forcing for training, autoregressive for testing.\n",
        "    \"\"\"\n",
        "    def __init__(self,\n",
        "                 reservoir_size=300,\n",
        "                 spectral_radius=0.95,\n",
        "                 connectivity=0.05,\n",
        "                 input_scale=1.0,\n",
        "                 leaking_rate=1.0,\n",
        "                 ridge_alpha=1e-6,\n",
        "                 seed=42):\n",
        "        self.reservoir_size = reservoir_size\n",
        "        self.spectral_radius = spectral_radius\n",
        "        self.connectivity = connectivity\n",
        "        self.input_scale = input_scale\n",
        "        self.leaking_rate = leaking_rate\n",
        "        self.ridge_alpha = ridge_alpha\n",
        "        self.seed = seed\n",
        "\n",
        "        np.random.seed(self.seed)\n",
        "        W_full = np.random.randn(reservoir_size, reservoir_size)*0.1\n",
        "        mask = (np.random.rand(reservoir_size, reservoir_size) < self.connectivity)\n",
        "        W = W_full * mask\n",
        "        W = scale_spectral_radius(W, self.spectral_radius)\n",
        "        self.W = W\n",
        "\n",
        "        np.random.seed(self.seed+1)\n",
        "        self.W_in = (np.random.rand(reservoir_size,3) - 0.5)*2.0*self.input_scale\n",
        "\n",
        "        self.W_out = None\n",
        "        self.x = np.zeros(reservoir_size)\n",
        "\n",
        "    def reset_state(self):\n",
        "        self.x = np.zeros(self.reservoir_size)\n",
        "\n",
        "    def _update(self, u):\n",
        "        pre_activation = self.W @ self.x + self.W_in @ u\n",
        "        x_new = np.tanh(pre_activation)\n",
        "        alpha = self.leaking_rate\n",
        "        self.x = (1.0 - alpha)*self.x + alpha*x_new\n",
        "\n",
        "    def collect_states(self, inputs, discard=100):\n",
        "        self.reset_state()\n",
        "        states = []\n",
        "        for val in inputs:\n",
        "            self._update(val)\n",
        "            states.append(self.x.copy())\n",
        "        states = np.array(states)\n",
        "        return states[discard:], states[:discard]\n",
        "\n",
        "    def fit_readout(self, train_input, train_target, discard=100):\n",
        "        states_use, _ = self.collect_states(train_input, discard=discard)\n",
        "        targets_use = train_target[discard:]\n",
        "        # X_aug = np.hstack([states_use, np.ones((states_use.shape[0],1))])\n",
        "\n",
        "        # polynomial readout\n",
        "        X_list = []\n",
        "        for s in states_use:\n",
        "            X_list.append(augment_state_with_squares(s))\n",
        "        X_aug = np.array(X_list)  # shape => [T-discard, 2N+1]\n",
        "\n",
        "        reg = Ridge(alpha=self.ridge_alpha, fit_intercept=False)\n",
        "        reg.fit(X_aug, targets_use)\n",
        "        self.W_out = reg.coef_\n",
        "\n",
        "    def predict_autoregressive(self, initial_input, n_steps):\n",
        "        preds = []\n",
        "        current_in = np.array(initial_input)\n",
        "        for _ in range(n_steps):\n",
        "            self._update(current_in)\n",
        "            # x_aug = np.concatenate([self.x, [1.0]])\n",
        "            x_aug = augment_state_with_squares(self.x)\n",
        "            out = self.W_out @ x_aug\n",
        "            preds.append(out)\n",
        "            current_in = out\n",
        "        return np.array(preds)\n",
        "\n",
        "    def predict_open_loop(self, test_input):\n",
        "        preds = []\n",
        "        for true_input in test_input:\n",
        "            self._update(true_input)\n",
        "            x_aug = augment_state_with_squares(self.x)\n",
        "            out = self.W_out @ x_aug\n",
        "            preds.append(out)\n",
        "        return np.array(preds)\n"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "085ffac6",
      "metadata": {
        "id": "085ffac6"
      },
      "source": [
        "### SCR"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "36365c50",
      "metadata": {
        "id": "36365c50"
      },
      "outputs": [],
      "source": [
        "class CR3D:\n",
        "    \"\"\"\n",
        "    Cycle (ring) reservoir for 3D->3D single-step,\n",
        "    teacher forcing for training, autoregressive for testing.\n",
        "    \"\"\"\n",
        "    def __init__(self,\n",
        "                 reservoir_size=300,\n",
        "                 spectral_radius=0.95,\n",
        "                 input_scale=1.0,\n",
        "                 leaking_rate=1.0,\n",
        "                 ridge_alpha=1e-6,\n",
        "                 seed=42):\n",
        "        self.reservoir_size = reservoir_size\n",
        "        self.spectral_radius = spectral_radius\n",
        "        self.input_scale = input_scale\n",
        "        self.leaking_rate = leaking_rate\n",
        "        self.ridge_alpha = ridge_alpha\n",
        "        self.seed = seed\n",
        "\n",
        "        np.random.seed(self.seed)\n",
        "        W = np.zeros((reservoir_size, reservoir_size))\n",
        "        for i in range(reservoir_size):\n",
        "            j = (i+1) % reservoir_size\n",
        "            W[i, j] = 1.0\n",
        "        W = scale_spectral_radius(W, self.spectral_radius)\n",
        "        self.W = W\n",
        "\n",
        "        np.random.seed(self.seed+1)\n",
        "        self.W_in = (np.random.rand(reservoir_size,3) - 0.5)*2.0*self.input_scale\n",
        "\n",
        "        self.W_out = None\n",
        "        self.x = np.zeros(reservoir_size)\n",
        "\n",
        "    def reset_state(self):\n",
        "        self.x = np.zeros(self.reservoir_size)\n",
        "\n",
        "    def _update(self, u):\n",
        "        pre_activation = self.W @ self.x + self.W_in @ u\n",
        "        x_new = np.tanh(pre_activation)\n",
        "        alpha = self.leaking_rate\n",
        "        self.x = (1.0 - alpha)*self.x + alpha*x_new\n",
        "\n",
        "    def collect_states(self, inputs, discard=100):\n",
        "        self.reset_state()\n",
        "        states = []\n",
        "        for val in inputs:\n",
        "            self._update(val)\n",
        "            states.append(self.x.copy())\n",
        "        states = np.array(states)\n",
        "        return states[discard:], states[:discard]\n",
        "\n",
        "    def fit_readout(self, train_input, train_target, discard=100):\n",
        "        states_use, _ = self.collect_states(train_input, discard=discard)\n",
        "        targets_use = train_target[discard:]\n",
        "        # X_aug = np.hstack([states_use, np.ones((states_use.shape[0],1))])\n",
        "\n",
        "        # polynomial readout\n",
        "        X_list = []\n",
        "        for s in states_use:\n",
        "            X_list.append(augment_state_with_squares(s))\n",
        "        X_aug = np.array(X_list)  # shape => [T-discard, 2N+1]\n",
        "\n",
        "        reg = Ridge(alpha=self.ridge_alpha, fit_intercept=False)\n",
        "        reg.fit(X_aug, targets_use)\n",
        "        self.W_out = reg.coef_\n",
        "\n",
        "    def predict_autoregressive(self, initial_input, n_steps):\n",
        "        preds = []\n",
        "        current_in = np.array(initial_input)\n",
        "        for _ in range(n_steps):\n",
        "            self._update(current_in)\n",
        "            # x_aug = np.concatenate([self.x, [1.0]])\n",
        "            x_aug = augment_state_with_squares(self.x)\n",
        "            out = self.W_out @ x_aug\n",
        "            preds.append(out)\n",
        "            current_in = out\n",
        "        return np.array(preds)\n",
        "\n",
        "    def predict_open_loop(self, test_input):\n",
        "        preds = []\n",
        "        for true_input in test_input:\n",
        "            self._update(true_input)\n",
        "            x_aug = augment_state_with_squares(self.x)\n",
        "            out = self.W_out @ x_aug\n",
        "            preds.append(out)\n",
        "        return np.array(preds)"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "7b01cc9a",
      "metadata": {
        "id": "7b01cc9a"
      },
      "source": [
        "### CRJ"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "deb13644",
      "metadata": {
        "id": "deb13644"
      },
      "outputs": [],
      "source": [
        "class CRJ3D:\n",
        "    \"\"\"\n",
        "    Cycle Reservoir with Jumps (CRJ) for 3D->3D single-step tasks.\n",
        "    We form a ring adjacency with an extra 'jump' edge in each row.\n",
        "    This can help capture multiple timescales or delayed memory\n",
        "    while retaining the easy ring structure.\n",
        "\n",
        "    The adjacency is built as follows (reservoir_size = mod N):\n",
        "      For each i in [0..N-1]:\n",
        "        W[i, (i+1) % mod N] = 1.0\n",
        "        W[i, (i+jump) % mod N] = 1.0\n",
        "    Then we scale by 'spectral_radius.' We do an ESN update\n",
        "    with readout [ x, x^2, 1 ] -> next step in R^3.\n",
        "    \"\"\"\n",
        "\n",
        "    def __init__(self,\n",
        "                 reservoir_size=300,\n",
        "                 jump=10,                # offset for the jump\n",
        "                 spectral_radius=0.95,\n",
        "                 input_scale=1.0,\n",
        "                 leaking_rate=1.0,\n",
        "                 ridge_alpha=1e-6,\n",
        "                 seed=42):\n",
        "        \"\"\"\n",
        "        reservoir_size: how many nodes in the ring\n",
        "        jump            : the offset for the 2nd connection from node i\n",
        "        spectral_radius : scale adjacency\n",
        "        input_scale     : scale factor for W_in\n",
        "        leaking_rate    : ESN 'alpha'\n",
        "        ridge_alpha     : ridge penalty for readout\n",
        "        seed            : random seed\n",
        "        \"\"\"\n",
        "        self.reservoir_size = reservoir_size\n",
        "        self.jump = jump\n",
        "        self.spectral_radius = spectral_radius\n",
        "        self.input_scale = input_scale\n",
        "        self.leaking_rate = leaking_rate\n",
        "        self.ridge_alpha = ridge_alpha\n",
        "        self.seed = seed\n",
        "\n",
        "        # build adjacency\n",
        "        np.random.seed(self.seed)\n",
        "        W = np.zeros((reservoir_size, reservoir_size))\n",
        "        for i in range(reservoir_size):\n",
        "            # cycle edge: i -> (i+1)%N\n",
        "            W[i, (i+1) % reservoir_size] = 1.0\n",
        "            # jump edge: i -> (i+jump)%N\n",
        "            W[i, (i + self.jump) % reservoir_size] = 1.0\n",
        "\n",
        "        # scale spectral radius\n",
        "        W = scale_spectral_radius(W, self.spectral_radius)\n",
        "        self.W = W\n",
        "\n",
        "        # input weights => shape [N,3]\n",
        "        np.random.seed(self.seed+100)\n",
        "        W_in = (np.random.rand(reservoir_size, 3) - 0.5)*2.0*self.input_scale\n",
        "        self.W_in = W_in\n",
        "\n",
        "        # readout\n",
        "        self.W_out = None\n",
        "        self.x = np.zeros(self.reservoir_size)\n",
        "\n",
        "    def reset_state(self):\n",
        "        self.x = np.zeros(self.reservoir_size)\n",
        "\n",
        "    def _update(self, u):\n",
        "        \"\"\"\n",
        "        Single-step ESN update:\n",
        "          x(t+1) = (1-alpha)*x(t) + alpha*tanh( W x(t) + W_in u(t) )\n",
        "        \"\"\"\n",
        "        pre_activation = self.W @ self.x + self.W_in @ u\n",
        "        x_new = np.tanh(pre_activation)\n",
        "        alpha = self.leaking_rate\n",
        "        self.x = (1.0 - alpha)*self.x + alpha*x_new\n",
        "\n",
        "    def collect_states(self, inputs, discard=100):\n",
        "        \"\"\"\n",
        "        Teacher forcing => feed the real 3D inputs => gather states.\n",
        "        Return (states_after_discard, states_discarded).\n",
        "        \"\"\"\n",
        "        self.reset_state()\n",
        "        states = []\n",
        "        for val in inputs:\n",
        "            self._update(val)\n",
        "            states.append(self.x.copy())\n",
        "        states = np.array(states)\n",
        "        return states[discard:], states[:discard]\n",
        "\n",
        "    def fit_readout(self, train_input, train_target, discard=100):\n",
        "        \"\"\"\n",
        "        gather states => polynomial readout => solve ridge\n",
        "        \"\"\"\n",
        "        states_use, _ = self.collect_states(train_input, discard=discard)\n",
        "        target_use = train_target[discard:]\n",
        "        X_list = []\n",
        "        for s in states_use:\n",
        "            # polynomial expansion => [ x, x^2, 1 ]\n",
        "            X_list.append(augment_state_with_squares(s))\n",
        "        X_aug = np.array(X_list)\n",
        "\n",
        "        reg = Ridge(alpha=self.ridge_alpha, fit_intercept=False)\n",
        "        reg.fit(X_aug, target_use)\n",
        "        self.W_out = reg.coef_  # shape => (3, 2N+1)\n",
        "\n",
        "    def predict_autoregressive(self, initial_input, n_steps):\n",
        "        \"\"\"\n",
        "        fully autoregressive => feed last output => next input\n",
        "        \"\"\"\n",
        "        preds = []\n",
        "        #self.reset_state()\n",
        "        current_in = np.array(initial_input)\n",
        "        for _ in range(n_steps):\n",
        "            self._update(current_in)\n",
        "            big_x = augment_state_with_squares(self.x)\n",
        "            out = self.W_out @ big_x  # shape => (3,)\n",
        "            preds.append(out)\n",
        "            current_in = out\n",
        "        return np.array(preds)\n",
        "\n",
        "    def predict_open_loop(self, test_input):\n",
        "        preds = []\n",
        "        for true_input in test_input:\n",
        "            self._update(true_input)\n",
        "            x_aug = augment_state_with_squares(self.x)\n",
        "            out = self.W_out @ x_aug\n",
        "            preds.append(out)\n",
        "        return np.array(preds)"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "22e8a8e0",
      "metadata": {
        "id": "22e8a8e0"
      },
      "source": [
        "### Small-World Res"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "5d8ea5bc",
      "metadata": {
        "id": "5d8ea5bc"
      },
      "outputs": [],
      "source": [
        "class SWRes3D:\n",
        "    \"\"\"\n",
        "    Small-World Reservoir ESN for 3D -> 3D single-step prediction.\n",
        "    \"\"\"\n",
        "\n",
        "    def __init__(self,\n",
        "                 reservoir_size=300,\n",
        "                 rewiring_prob=0.1,\n",
        "                 degree=6,\n",
        "                 spectral_radius=0.95,\n",
        "                 input_scale=1.0,\n",
        "                 leaking_rate=1.0,\n",
        "                 ridge_alpha=1e-6,\n",
        "                 activation_choices=('tanh', 'relu', 'sin', 'linear'),\n",
        "                 seed=42):\n",
        "\n",
        "        self.reservoir_size = reservoir_size\n",
        "        self.rewiring_prob = rewiring_prob\n",
        "        self.degree = degree\n",
        "        self.spectral_radius = spectral_radius\n",
        "        self.input_scale = input_scale\n",
        "        self.leaking_rate = leaking_rate\n",
        "        self.ridge_alpha = ridge_alpha\n",
        "        self.activation_choices = activation_choices\n",
        "        self.seed = seed\n",
        "\n",
        "        np.random.seed(self.seed)\n",
        "        ws_graph = nx.watts_strogatz_graph(n=reservoir_size, k=degree, p=rewiring_prob, seed=seed)\n",
        "        A = nx.to_numpy_array(ws_graph)\n",
        "        W = A * np.random.uniform(-1, 1, size=A.shape)\n",
        "        self.W = scale_spectral_radius(W, spectral_radius)\n",
        "\n",
        "        np.random.seed(self.seed + 100)\n",
        "        self.W_in = (np.random.rand(reservoir_size, 3) - 0.5) * 2 * input_scale\n",
        "\n",
        "        np.random.seed(self.seed + 200)\n",
        "        self.node_activations = np.random.choice(activation_choices, size=reservoir_size)\n",
        "\n",
        "        self.reset_state()\n",
        "        self.W_out = None\n",
        "\n",
        "    def reset_state(self):\n",
        "        self.x = np.zeros(self.reservoir_size)\n",
        "\n",
        "    def _apply_activation(self, kind, val):\n",
        "        return np.tanh(val)\n",
        "\n",
        "    def _update(self, u):\n",
        "        pre = self.W @ self.x + self.W_in @ u\n",
        "        x_new = np.zeros_like(self.x)\n",
        "        for i in range(self.reservoir_size):\n",
        "            act = self.node_activations[i]\n",
        "            x_new[i] = self._apply_activation(act, pre[i])\n",
        "        self.x = (1 - self.leaking_rate) * self.x + self.leaking_rate * x_new\n",
        "\n",
        "    def collect_states(self, inputs, discard=100):\n",
        "        self.reset_state()\n",
        "        states = []\n",
        "        for u in inputs:\n",
        "            self._update(u)\n",
        "            states.append(self.x.copy())\n",
        "        return np.array(states)[discard:], np.array(states)[:discard]\n",
        "\n",
        "    def fit_readout(self, train_input, train_target, discard=100):\n",
        "        states, _ = self.collect_states(train_input, discard=discard)\n",
        "        targets = train_target[discard:]\n",
        "\n",
        "        X_aug = np.hstack([states, states**2, np.ones((len(states), 1))])\n",
        "        ridge = Ridge(alpha=self.ridge_alpha, fit_intercept=False)\n",
        "        ridge.fit(X_aug, targets)\n",
        "        self.W_out = ridge.coef_\n",
        "\n",
        "    def predict_open_loop(self, inputs):\n",
        "        preds = []\n",
        "        for u in inputs:\n",
        "            self._update(u)\n",
        "            x_aug = np.concatenate([self.x, self.x**2, [1.0]])\n",
        "            preds.append(self.W_out @ x_aug)\n",
        "        return np.array(preds)\n",
        "\n",
        "    def predict_autoregressive(self, initial_input, num_steps):\n",
        "        preds = []\n",
        "        current = initial_input.copy()\n",
        "        for _ in range(num_steps):\n",
        "            self._update(current)\n",
        "            x_aug = np.concatenate([self.x, self.x**2, [1.0]])\n",
        "            out = self.W_out @ x_aug\n",
        "            preds.append(out)\n",
        "            current = out\n",
        "        return np.array(preds)\n"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "d82cfc0d",
      "metadata": {
        "id": "d82cfc0d"
      },
      "source": [
        "### MCI-ESN"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "5a28cfbc",
      "metadata": {
        "id": "5a28cfbc"
      },
      "outputs": [],
      "source": [
        "class MCI3D:\n",
        "    \"\"\"\n",
        "    Minimum Complexity Interaction ESN (MCI-ESN).\n",
        "\n",
        "    This class implements the approach described in:\n",
        "      \"A Minimum Complexity Interaction Echo State Network\"\n",
        "        by Jianming Liu, Xu Xu, Eric Li (2024).\n",
        "\n",
        "    The model structure:\n",
        "      - We maintain two 'simple cycle' reservoirs (each of size N).\n",
        "      - Each reservoir is a ring with weight = l, i.e.\n",
        "            W_res[i, (i+1)%N] = l\n",
        "        plus the corner wrap from (N-1)->0, also = l. \n",
        "      - The two reservoirs interact via a minimal connection matrix:\n",
        "         exactly 2 cross-connections with weight = g.\n",
        "         (One might connect x2[-1], x2[-2], ...\n",
        "          But we do where reservoir1 sees x2[-1]\n",
        "          in one location, and reservoir2 sees x1[-1] likewise.)\n",
        "      - Activation function in reservoir1 is cos(·), and in reservoir2 is sin(·).\n",
        "      - They each have a separate input weight matrix: Win1 and Win2.\n",
        "        The final state is a linear combination\n",
        "           x(t) = h*x1(t) + (1-h)*x2(t).\n",
        "      - Then we do a polynomial readout [x, x^2, 1] -> output.\n",
        "      - We feed teacher forcing in collect_states,\n",
        "        then solve readout with Ridge regression.\n",
        "\n",
        "    References:\n",
        "      - Liu, J., Xu, X., & Li, E. (2024).\n",
        "        \"A minimum complexity interaction echo state network,\"\n",
        "         Neural Computing and Applications.\n",
        "\n",
        "    \"\"\"\n",
        "\n",
        "    def __init__(\n",
        "        self,\n",
        "        reservoir_size=300,\n",
        "        cycle_weight=0.9,      # 'l' in the paper\n",
        "        connect_weight=0.9,    # 'g' in the paper\n",
        "        input_scale=0.2,\n",
        "        leaking_rate=1.0,\n",
        "        ridge_alpha=1e-6,\n",
        "        combine_factor=0.1,    # 'h' in the paper\n",
        "        seed=47,\n",
        "        v1=0.6, v2=0.6         # fixed values for v1, v2\n",
        "    ):\n",
        "        \"\"\"\n",
        "        reservoir_size: N, size of each cycle reservoir\n",
        "        cycle_weight : l, ring adjacency weight in [0,1), ensures cycle synergy\n",
        "        connect_weight: g, cross-connection weight between the two cycle reservoirs\n",
        "        input_scale   : scale factor for input->reservoir weights\n",
        "        leaking_rate  : ESN update alpha\n",
        "        ridge_alpha   : readout ridge penalty\n",
        "        combine_factor: h in [0,1], to form x(t)= h*x1(t)+(1-h)*x2(t) as final combined state\n",
        "        seed          : random seed\n",
        "        \"\"\"\n",
        "        self.reservoir_size = reservoir_size\n",
        "        self.cycle_weight   = cycle_weight\n",
        "        self.connect_weight = connect_weight\n",
        "        self.input_scale    = input_scale\n",
        "        self.leaking_rate   = leaking_rate\n",
        "        self.ridge_alpha    = ridge_alpha\n",
        "        self.combine_factor = combine_factor\n",
        "        self.seed           = seed\n",
        "        self.v1 = v1\n",
        "        self.v2 = v2\n",
        "\n",
        "        # We'll define (and build) adjacency for each cycle,\n",
        "        # plus cross-connection for two sub-reservoirs.\n",
        "        # We'll define 2 input weight mats: Win1, Win2.\n",
        "        # We'll define states x1(t), x2(t).\n",
        "        # We'll define readout W_out after training.\n",
        "\n",
        "        self._build_mci_esn()\n",
        "\n",
        "    def _build_mci_esn(self):\n",
        "        \"\"\"\n",
        "        Build all the internal parameters:\n",
        "         - ring adjacency for each reservoir\n",
        "         - cross-reservoir connection\n",
        "         - input weights for each reservoir\n",
        "         - initial states\n",
        "        \"\"\"\n",
        "        np.random.seed(self.seed)\n",
        "\n",
        "        N = self.reservoir_size\n",
        "\n",
        "        # Build ring adjacency W_res in shape [N, N], with cycle_weight on ring\n",
        "        W_res = np.zeros((N, N))\n",
        "        for i in range(N):\n",
        "            j = (i+1) % N\n",
        "            W_res[j, i] = self.cycle_weight\n",
        "        self.W_res = W_res  # shared by both sub-reservoirs\n",
        "\n",
        "        # Build cross-connection W_cn for shape [N,N],\n",
        "\n",
        "        W_cn = np.zeros((N, N))\n",
        "\n",
        "        W_cn[0, N-1] = self.connect_weight\n",
        "        if N>1:\n",
        "            # W_cn[1, N-2] = self.connect_weight\n",
        "            W_cn[N-1, 0] = self.connect_weight\n",
        "        self.W_cn = W_cn\n",
        "\n",
        "        self.Win1 = None\n",
        "        self.Win2 = None\n",
        "\n",
        "        # We'll define states x1(t), x2(t).\n",
        "        self.x1 = None\n",
        "        self.x2 = None\n",
        "\n",
        "        self.W_out = None\n",
        "\n",
        "    def _init_substates(self):\n",
        "        \"\"\"\n",
        "        Once we know reservoir_size, we define x1, x2 as zeros.\n",
        "        We'll call this in reset_state or at fit time.\n",
        "        \"\"\"\n",
        "        N = self.reservoir_size\n",
        "        self.x1 = np.zeros(N)\n",
        "        self.x2 = np.zeros(N)\n",
        "\n",
        "    def reset_state(self):\n",
        "        if self.x1 is not None:\n",
        "            self.x1[:] = 0.0\n",
        "        if self.x2 is not None:\n",
        "            self.x2[:] = 0.0\n",
        "\n",
        "    def _update(self, u):\n",
        "        \"\"\"\n",
        "        Single-step reservoir update.\n",
        "        x1(t+1) = cos( Win1*u(t+1) + W_res*x1(t) + W_cn*x2(t) )\n",
        "        x2(t+1) = sin( Win2*u(t+1) + W_res*x2(t) + W_cn*x1(t) )\n",
        "        Then x(t)= h*x1(t+1) + (1-h)* x2(t+1).\n",
        "        We'll define the leaky integration.\n",
        "        \"\"\"\n",
        "        alpha = self.leaking_rate\n",
        "\n",
        "        # pre activation for reservoir1\n",
        "        pre1 = self.Win1 @ u + self.W_res @ self.x1 + self.W_cn @ self.x2\n",
        "        # reservoir1 uses cos\n",
        "        new_x1 = np.cos(pre1)\n",
        "\n",
        "        # reservoir2 uses sin\n",
        "        pre2 = self.Win2 @ u + self.W_res @ self.x2 + self.W_cn @ self.x1\n",
        "        new_x2 = np.sin(pre2)\n",
        "\n",
        "        self.x1 = (1.0 - alpha)*self.x1 + alpha*new_x1\n",
        "        self.x2 = (1.0 - alpha)*self.x2 + alpha*new_x2\n",
        "\n",
        "    def _combine_state(self):\n",
        "        \"\"\"\n",
        "        Combine x1(t), x2(t) => x(t) = h*x1 + (1-h)*x2\n",
        "        \"\"\"\n",
        "        h = self.combine_factor\n",
        "        return h*self.x1 + (1.0 - h)*self.x2\n",
        "\n",
        "    def collect_states(self, inputs, discard=100):\n",
        "        # We reset the reservoir to zero\n",
        "        self.reset_state()\n",
        "        states = []\n",
        "        for t in range(len(inputs)):\n",
        "            self._update(inputs[t])   # feed the REAL input from the dataset\n",
        "            combined = self._combine_state()\n",
        "            states.append(combined.copy())\n",
        "        states = np.array(states)  # shape => [T, N]\n",
        "        return states[discard:], states[:discard]\n",
        "\n",
        "\n",
        "    def fit_readout(self, train_input, train_target, discard=100):\n",
        "        \"\"\"\n",
        "        Build input weights if needed, gather states on the training data (teacher forcing),\n",
        "        then solve a polynomial readout [x, x^2, 1]->train_target(t).\n",
        "\n",
        "        train_input : shape [T, d_in]\n",
        "        train_target: shape [T, d_out]\n",
        "        discard     : # of states to discard for warmup\n",
        "        \"\"\"\n",
        "        T = len(train_input)\n",
        "        if T<2:\n",
        "            raise ValueError(\"Not enough training data\")\n",
        "\n",
        "        d_in = train_input.shape[1]\n",
        "        # d_out = train_target.shape[1]\n",
        "\n",
        "        # built Win1, Win2\n",
        "        if self.Win1 is None or self.Win2 is None:\n",
        "            np.random.seed(self.seed+100)\n",
        "            # build V1, V2 in shape [N, d_in]\n",
        "            N = self.reservoir_size\n",
        "            # V1 = (np.random.rand(N, d_in)-0.5)*2.0*self.input_scale\n",
        "            # V2 = (np.random.rand(N, d_in)-0.5)*2.0*self.input_scale\n",
        "\n",
        "            sign_V1 = np.random.choice([-1, 1], size=(N, d_in))\n",
        "            sign_V2 = np.random.choice([-1, 1], size=(N, d_in))\n",
        "\n",
        "            v1, v2 = self.v1, self.v2  # fixed values for V1, V2\n",
        "\n",
        "            V1 = v1 * sign_V1 * self.input_scale\n",
        "            V2 = v2 * sign_V2 * self.input_scale\n",
        "\n",
        "            # eq(10): Win1= V1 - V2, Win2= V1 + V2\n",
        "            self.Win1 = V1 - V2\n",
        "            self.Win2 = V1 + V2\n",
        "\n",
        "        # define x1, x2\n",
        "        self._init_substates()\n",
        "\n",
        "        # gather states\n",
        "        states_use, _ = self.collect_states(train_input, discard=discard)\n",
        "        target_use = train_target[discard:]  # shape => [T-discard, d_out]\n",
        "\n",
        "        # polynomial readout\n",
        "        X_list = []\n",
        "        for s in states_use:\n",
        "            X_list.append(augment_state_with_squares(s))\n",
        "        X_aug = np.array(X_list)  # shape => [T-discard, 2N+1]\n",
        "\n",
        "        # Solve ridge\n",
        "        reg = Ridge(alpha=self.ridge_alpha, fit_intercept=False)\n",
        "        reg.fit(X_aug, target_use)\n",
        "        # W_out => shape [d_out, 2N+1]\n",
        "        self.W_out = reg.coef_\n",
        "\n",
        "    def predict_autoregressive(self, initial_input, n_steps):\n",
        "        \"\"\"\n",
        "        Fully autoregressive:\n",
        "\n",
        "        \"\"\"\n",
        "        preds = []\n",
        "        # re-init states\n",
        "        #self._init_substates()\n",
        "\n",
        "        # initial_input => shape (d_in,)\n",
        "        current_in = np.array(initial_input)\n",
        "\n",
        "        for _ in range(n_steps):\n",
        "            self._update(current_in)\n",
        "            # read out\n",
        "            combined = self._combine_state()\n",
        "            big_x = augment_state_with_squares(combined)\n",
        "            out = self.W_out @ big_x  # shape => (d_out,)\n",
        "\n",
        "            preds.append(out)\n",
        "            current_in = out  # feed output back as next input\n",
        "\n",
        "        return np.array(preds)\n",
        "\n",
        "    def predict_open_loop(self, test_input):\n",
        "        preds = []\n",
        "        for true_input in test_input:\n",
        "            self._update(true_input)\n",
        "            combined = self._combine_state()\n",
        "            x_aug = augment_state_with_squares(combined)\n",
        "            out = self.W_out @ x_aug\n",
        "            preds.append(out)\n",
        "        return np.array(preds)\n"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "2ea2e53a",
      "metadata": {
        "id": "2ea2e53a"
      },
      "source": [
        "### DeepESN"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "3cc3e873",
      "metadata": {
        "id": "3cc3e873"
      },
      "outputs": [],
      "source": [
        "class DeepESN3D:\n",
        "    \"\"\"\n",
        "    Deep Echo State Network (DeepESN) for multi-layered reservoir computing.\n",
        "    Each layer has its own reservoir, and the states are propagated through layers.\n",
        "    \"\"\"\n",
        "\n",
        "    def __init__(self,\n",
        "                 num_layers=3,\n",
        "                 reservoir_size=100,\n",
        "                 spectral_radius=0.95,\n",
        "                 connectivity=0.1,\n",
        "                 input_scale=1.0,\n",
        "                 leaking_rate=1.0,\n",
        "                 ridge_alpha=1e-6,\n",
        "                 activation_choices=('tanh','relu','sin','linear'),\n",
        "                 seed=42):\n",
        "        \"\"\"\n",
        "        Parameters:\n",
        "        - num_layers: Number of reservoir layers.\n",
        "        - reservoir_size: Number of neurons in each reservoir layer.\n",
        "        \"\"\"\n",
        "        self.num_layers = num_layers\n",
        "        self.reservoir_size = reservoir_size\n",
        "        self.spectral_radius = spectral_radius\n",
        "        self.connectivity = connectivity\n",
        "        self.input_scale = input_scale\n",
        "        self.leaking_rate = leaking_rate\n",
        "        self.ridge_alpha = ridge_alpha\n",
        "        self.activation_choices = activation_choices\n",
        "        self.seed = seed\n",
        "\n",
        "        # Initialize reservoirs and input weights for each layer\n",
        "        self.reservoirs = []\n",
        "        self.input_weights = []\n",
        "        self.states = []\n",
        "\n",
        "        np.random.seed(self.seed)\n",
        "        for layer in range(num_layers):\n",
        "            np.random.seed(seed + layer)\n",
        "            W = np.random.randn(reservoir_size, reservoir_size) * 0.1\n",
        "            mask = (np.random.rand(reservoir_size, reservoir_size) < self.connectivity)\n",
        "            W = W * mask\n",
        "            W = scale_spectral_radius(W, spectral_radius)\n",
        "            self.reservoirs.append(W)\n",
        "\n",
        "            if layer == 0 :\n",
        "                W_in = (np.random.rand(reservoir_size, 3) - 0.5) * 2.0 * input_scale\n",
        "            else:\n",
        "                W_in = (np.random.rand(reservoir_size, reservoir_size) - 0.5) * 2.0 * input_scale\n",
        "            self.input_weights.append(W_in)\n",
        "\n",
        "        np.random.seed(self.seed + 200)\n",
        "        self.node_activations = np.random.choice(self.activation_choices, size=self.reservoir_size)\n",
        "\n",
        "        self.W_out = None\n",
        "        self.reset_state()\n",
        "\n",
        "    def reset_state(self):\n",
        "        \"\"\"\n",
        "        Reset the states of all reservoir layers.\n",
        "        \"\"\"\n",
        "        self.states = [np.zeros(self.reservoir_size) for _ in range(self.num_layers)]\n",
        "\n",
        "    def _apply_activation(self, act_type, val):\n",
        "        return np.tanh(val)\n",
        "\n",
        "\n",
        "    def _update_layer(self, layer_idx, u):\n",
        "        \"\"\"\n",
        "        Update a single reservoir layer.\n",
        "        \"\"\"\n",
        "        pre_activation = self.reservoirs[layer_idx] @ self.states[layer_idx]\n",
        "        if layer_idx == 0:\n",
        "            pre_activation += self.input_weights[layer_idx] @ u\n",
        "        else:\n",
        "            pre_activation += self.input_weights[layer_idx] @ self.states[layer_idx - 1]\n",
        "\n",
        "        x_new = np.zeros_like(pre_activation)\n",
        "        for i in range(self.reservoir_size):\n",
        "            activation = self.node_activations[i]\n",
        "            x_new[i] = self._apply_activation(activation, pre_activation[i])\n",
        "        alpha = self.leaking_rate\n",
        "        self.states[layer_idx] = (1.0 - alpha) * self.states[layer_idx] + alpha * x_new\n",
        "\n",
        "    def collect_states(self, inputs, discard=100):\n",
        "        self.reset_state()\n",
        "        all_states = []\n",
        "        for u in inputs:\n",
        "            for layer_idx in range(self.num_layers):\n",
        "                self._update_layer(layer_idx, u)\n",
        "            all_states.append(np.concatenate(self.states))\n",
        "        all_states = np.array(all_states)\n",
        "        return all_states[discard:], all_states[:discard]\n",
        "\n",
        "    def fit_readout(self, train_input, train_target, discard=100):\n",
        "        \"\"\"\n",
        "        Train the readout layer using ridge regression.\n",
        "        \"\"\"\n",
        "        states_use, _ = self.collect_states(train_input, discard=discard)\n",
        "        targets_use = train_target[discard:]\n",
        "\n",
        "\n",
        "        X_list = []\n",
        "        for s in states_use:\n",
        "            X_list.append( np.concatenate([s, s**2, [1.0]]) )\n",
        "        X_aug = np.array(X_list)                                    # shape [T-discard, 2N*L+1]\n",
        "\n",
        "        reg = Ridge(alpha=self.ridge_alpha, fit_intercept=False)\n",
        "        reg.fit(X_aug, targets_use)\n",
        "        self.W_out = reg.coef_\n",
        "\n",
        "    def predict_open_loop(self, inputs):\n",
        "        \"\"\"\n",
        "        Single-step-ahead inference on test data.\n",
        "        \"\"\"\n",
        "        preds = []\n",
        "        for u in inputs:\n",
        "            for layer_idx in range(self.num_layers):\n",
        "                self._update_layer(layer_idx, u)\n",
        "            state = np.concatenate(self.states)\n",
        "            x_aug = np.concatenate([state, (state)**2, [1.0]])  \n",
        "            out = self.W_out @ x_aug\n",
        "            preds.append(out)\n",
        "        return np.array(preds)\n",
        "\n",
        "    def predict_autoregressive(self, initial_input, num_steps):\n",
        "        \"\"\"\n",
        "        Autoregressive multi-step forecasting for num_steps\n",
        "        \"\"\"\n",
        "        preds = []\n",
        "        current_input = initial_input.copy()\n",
        "\n",
        "        for _ in range(num_steps):\n",
        "            for layer_idx in range(self.num_layers):\n",
        "                self._update_layer(layer_idx, current_input)\n",
        "            state = np.concatenate(self.states)\n",
        "            x_aug = np.concatenate([state, (state)**2, [1.0]])  \n",
        "            out = self.W_out @ x_aug\n",
        "            preds.append(out)\n",
        "            current_input = out\n",
        "\n",
        "        return np.array(preds)"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "6f4741c6",
      "metadata": {
        "id": "6f4741c6"
      },
      "source": [
        "# TRIGR"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "817c595b",
      "metadata": {
        "id": "817c595b"
      },
      "outputs": [],
      "source": [
        "class GliaNeuronTripartiteReservoirESN:\n",
        "    \"\"\"\n",
        "    TRIGR\n",
        "\n",
        "    Fast neuronal core x in R^N bidirectionally coupled to an astrocyte lattice:\n",
        "      • c in R^M : astrocytic (slow, diffusive, saturating)\n",
        "      • g in R^M : gliotransmitter fraction (slow release/recovery)\n",
        "\n",
        "    \"\"\"\n",
        "\n",
        "    # ---------------------- helper (power iteration) ----------------------\n",
        "    @staticmethod\n",
        "    def _opnorm_rect(apply_A, apply_AT, n_in, iters=60, rng=None):\n",
        "        \"\"\"Spectral norm ||A||_2 for a linear map via power iteration on A^T A.\"\"\"\n",
        "        if rng is None:\n",
        "            rng = np.random.default_rng()\n",
        "        v = rng.standard_normal(n_in).astype(np.float32)\n",
        "        v /= (np.linalg.norm(v) + 1e-8)\n",
        "        for _ in range(iters):\n",
        "            v = apply_AT(apply_A(v))\n",
        "            nv = float(np.linalg.norm(v) + 1e-12)\n",
        "            if nv == 0.0:\n",
        "                break\n",
        "            v = (v / nv).astype(np.float32)\n",
        "        Av = apply_A(v)\n",
        "        return float(np.linalg.norm(Av) + 1e-12)\n",
        "\n",
        "    @staticmethod\n",
        "    def _opnorm_matrix(A, iters=60, rng=None):\n",
        "        \"\"\"Spectral norm of numpy array A via power iteration on A^T A.\"\"\"\n",
        "        if rng is None:\n",
        "            rng = np.random.default_rng()\n",
        "        n_in = A.shape[1]\n",
        "        def apply_A(x):  return A @ x\n",
        "        def apply_AT(y): return A.T @ y\n",
        "        return GliaNeuronTripartiteReservoirESN._opnorm_rect(apply_A, apply_AT, n_in, iters=iters, rng=rng)\n",
        "\n",
        "    # -------------------------- constructor --------------------------\n",
        "    def __init__(\n",
        "        self,\n",
        "        # sizes\n",
        "        reservoir_size: int = 800,   # N\n",
        "        input_dim: int = 3,\n",
        "        astro_nx: int = 20,          # M = astro_nx * astro_ny\n",
        "        astro_ny: int = 20,\n",
        "        rel_channels: int = 128,     # P\n",
        "        # kinetics / rates\n",
        "        leak_x: float = 0.25,        # λ\n",
        "        rate_c: float = 0.05,        # α\n",
        "        rate_g: float = 0.05,        # ρ\n",
        "        diff_D: float = 0.5,         # D (will be scaled safely)\n",
        "        # neuron bias\n",
        "        bias: float | np.ndarray = 0.0,  # scalar or length-N\n",
        "        # nonlinearities (F and Γ)\n",
        "        c_max: float = 1.0,          # max Ca\n",
        "        k_c: float = 1.0,            # slope for F (L_F = k_c*c_max/4 ≤ 1 advised)\n",
        "        theta_c: float = 0.0,        # midpoint for F\n",
        "        k_g: float = 0.8,            # slope for Γ (L_Γ = k_g/4 ≤ 1 advised)\n",
        "        theta_g: float = 0.0,        # midpoint for Γ\n",
        "        zeta: float = 0.0,           # tonic drive (scalar)\n",
        "        g_mode: str = \"linear\",      # \"linear\" | \"depletion\"\n",
        "        delta_g: float = 0.2,        # depletion parameter δ ∈ (0,1) if g_mode=\"depletion\"\n",
        "        # input map\n",
        "        input_scale: float = 0.5,\n",
        "        # randomization / sparsity\n",
        "        W_sparsity: float = 0.0,     # fraction of zeros in W_r\n",
        "        footprints_sparsity: float = 0.5,  # sparsity for H before row-norm\n",
        "        block_scale: float = 1.0,    # base std for random blocks\n",
        "        eta_bg: float = 1.0,         # scale in B_g = eta * (H W_rel)^T\n",
        "        # spectral safety targets (row budgets, both <1)\n",
        "        rho_x_target: float = 0.90,  # target for ||W_r|| + ||B_g||\n",
        "        rho_c_target: float = 0.90,  # target for D||L|| + L_F||H W_rel||\n",
        "        # read-out\n",
        "        ridge_alpha: float = 1e-6,\n",
        "        use_poly: bool = True,\n",
        "        feature_mode: str = \"x_c_g\",  # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "        seed: int = 42,\n",
        "    ):\n",
        "        # ---- sanity checks\n",
        "        if reservoir_size < 2:\n",
        "            raise ValueError(\"reservoir_size must be ≥ 2\")\n",
        "        if astro_nx < 1 or astro_ny < 1:\n",
        "            raise ValueError(\"astro grid must be ≥ 1×1\")\n",
        "        if rel_channels < 1:\n",
        "            raise ValueError(\"rel_channels must be ≥ 1\")\n",
        "        if not 0 < leak_x <= 1:\n",
        "            raise ValueError(\"leak_x must be in (0,1]\")\n",
        "        if not 0 < rate_c < 1 or not 0 < rate_g < 1:\n",
        "            raise ValueError(\"rates must be in (0,1)\")\n",
        "        if g_mode not in {\"linear\", \"depletion\"}:\n",
        "            raise ValueError(\"g_mode must be 'linear' or 'depletion'\")\n",
        "        if not (0 <= W_sparsity < 1 and 0 <= footprints_sparsity < 1):\n",
        "            raise ValueError(\"sparsities in [0,1)\")\n",
        "        if feature_mode not in {\"x\", \"x_c_g\", \"x_x2_g\"}:\n",
        "            raise ValueError(\"feature_mode must be 'x', 'x_c_g', or 'x_x2_g'\")\n",
        "\n",
        "        # ---- store\n",
        "        self.N = int(reservoir_size)\n",
        "        self.d_in = int(input_dim)\n",
        "        self.nx = int(astro_nx)\n",
        "        self.ny = int(astro_ny)\n",
        "        self.M = self.nx * self.ny\n",
        "        self.P = int(rel_channels)\n",
        "\n",
        "        self.lam = float(leak_x)\n",
        "        self.alpha = float(rate_c)\n",
        "        self.rho = float(rate_g)\n",
        "        self.D = float(diff_D)\n",
        "\n",
        "        self.c_max = float(c_max)\n",
        "        self.k_c = float(k_c)\n",
        "        self.theta_c = float(theta_c)\n",
        "        self.k_g = float(k_g)\n",
        "        self.theta_g = float(theta_g)\n",
        "        self.zeta_scalar = float(zeta)\n",
        "        self.g_mode = g_mode\n",
        "        self.delta_g = float(delta_g)\n",
        "\n",
        "        self.in_scale = float(input_scale)\n",
        "        self.W_sparsity = float(W_sparsity)\n",
        "        self.fp_sparsity = float(footprints_sparsity)\n",
        "        self.block_scale = float(block_scale)\n",
        "        self.eta_bg = float(eta_bg)\n",
        "\n",
        "        self.rho_x_target = float(rho_x_target)\n",
        "        self.rho_c_target = float(rho_c_target)\n",
        "\n",
        "        self.ridge_alpha = float(ridge_alpha)\n",
        "        self.use_poly = bool(use_poly)\n",
        "        self.feature_mode = feature_mode\n",
        "        self.seed = int(seed)\n",
        "\n",
        "        rng = np.random.default_rng(self.seed)\n",
        "\n",
        "        # ---- neuron bias b\n",
        "        if np.isscalar(bias):\n",
        "            self.b = np.full(self.N, float(bias), dtype=np.float32)\n",
        "        else:\n",
        "            b = np.asarray(bias, dtype=np.float32).reshape(-1)\n",
        "            if b.size != self.N:\n",
        "                raise ValueError(\"bias must be scalar or length-N\")\n",
        "            self.b = b\n",
        "\n",
        "        # ---- 5-point stencil Laplacian (combinatorial)\n",
        "        def laplacian_apply(vec):\n",
        "            c = vec.reshape(self.ny, self.nx)\n",
        "            up    = np.pad(c[:-1, :],  ((1,0),(0,0)))\n",
        "            down  = np.pad(c[1:,  :],  ((0,1),(0,0)))\n",
        "            left  = np.pad(c[:, :-1],  ((0,0),(1,0)))\n",
        "            right = np.pad(c[:, 1:],   ((0,0),(0,1)))\n",
        "            neigh_sum = up + down + left + right\n",
        "            deg = np.full_like(c, 4.0)\n",
        "            deg[0, :] -= 1.0; deg[-1, :] -= 1.0; deg[:, 0] -= 1.0; deg[:, -1] -= 1.0\n",
        "            out = deg * c - neigh_sum\n",
        "            return out.reshape(-1).astype(np.float32)\n",
        "        self._laplacian_apply = laplacian_apply\n",
        "\n",
        "        # ---- random maps\n",
        "        # W_r: N×N\n",
        "        W_r = rng.standard_normal((self.N, self.N)).astype(np.float32) * self.block_scale\n",
        "        if self.W_sparsity > 0:\n",
        "            mask = (rng.random((self.N, self.N)) > self.W_sparsity).astype(np.float32)\n",
        "            W_r *= mask\n",
        "        self.W_r = W_r\n",
        "\n",
        "        # W_in: N×d_in\n",
        "        self.W_in = (rng.uniform(-1.0, 1.0, size=(self.N, self.d_in)) * self.in_scale).astype(np.float32)\n",
        "\n",
        "        # W_rel: P×N\n",
        "        self.W_rel = (rng.standard_normal((self.P, self.N)).astype(np.float32) * self.block_scale)\n",
        "\n",
        "        # H: M×P nonnegative sparse-ish with row-normalization\n",
        "        H = rng.random((self.M, self.P)).astype(np.float32) * self.block_scale\n",
        "        if self.fp_sparsity > 0:\n",
        "            mask = (rng.random((self.M, self.P)) > self.fp_sparsity).astype(np.float32)\n",
        "            H *= mask\n",
        "        H = H / (H.sum(axis=1, keepdims=True) + 1e-8)  # row-normalize (keep rows nonzero)\n",
        "        self.H = H.astype(np.float32)\n",
        "\n",
        "        # ----------------- estimate ||H W_rel|| and ||L|| -----------------\n",
        "        def apply_A(x):   # x ∈ R^N → R^M\n",
        "            return (self.H @ (self.W_rel @ x)).astype(np.float32)\n",
        "        def apply_AT(y):  # y ∈ R^M → R^N\n",
        "            return (self.W_rel.T @ (self.H.T @ y)).astype(np.float32)\n",
        "        nHW = self._opnorm_rect(apply_A, apply_AT, n_in=self.N, iters=60, rng=rng)\n",
        "\n",
        "        def opnorm_L(iters=60):\n",
        "            v = rng.standard_normal(self.M).astype(np.float32)\n",
        "            v /= (np.linalg.norm(v) + 1e-8)\n",
        "            for _ in range(iters):\n",
        "                w = self._laplacian_apply(v)\n",
        "                nw = float(np.linalg.norm(w) + 1e-12)\n",
        "                if nw == 0.0:\n",
        "                    break\n",
        "                v = (w / nw).astype(np.float32)\n",
        "            return float(np.linalg.norm(self._laplacian_apply(v)) + 1e-12)\n",
        "        nL = opnorm_L(iters=60)\n",
        "\n",
        "        L_F = (self.k_c * self.c_max) / 4.0  # max slope of logistic * c_max\n",
        "\n",
        "        # ----------------- Ca-row scaling: scale BOTH D and H -----------------\n",
        "        denom_c = self.D * nL + L_F * nHW + 1e-8\n",
        "        s_c = self.rho_c_target / denom_c\n",
        "        self.D *= s_c\n",
        "        self.H *= s_c  # affects A = H W_rel\n",
        "\n",
        "        # ----------------- build B_g AFTER H-scaling -----------------\n",
        "        # B_g = eta * (H W_rel)^T ∈ R^{N×M} aligns astro→neuron footprint with neuron→astro map\n",
        "        HW = (self.H @ self.W_rel)           # M×N\n",
        "        self.B_g = (self.eta_bg * HW.T).astype(np.float32)  # N×M\n",
        "\n",
        "        # ----------------- neuron row scaling: ||W_r|| + ||B_g|| ≤ rho_x_target -----------------\n",
        "        nWr = self._opnorm_matrix(self.W_r, iters=60, rng=rng)\n",
        "        nBg = self._opnorm_matrix(self.B_g, iters=60, rng=rng)\n",
        "        s_x = self.rho_x_target / (nWr + nBg + 1e-8)\n",
        "        self.W_r *= s_x\n",
        "        self.B_g *= s_x\n",
        "\n",
        "        # ---------- runtime state (x, c, g) ----------\n",
        "        self.x = np.zeros(self.N, dtype=np.float32)\n",
        "        self.c = np.zeros(self.M, dtype=np.float32)\n",
        "        self.g = np.zeros(self.M, dtype=np.float32)\n",
        "\n",
        "        # read-out\n",
        "        self.W_out: np.ndarray | None = None\n",
        "\n",
        "    # -------------------- nonlinearities --------------------\n",
        "    def _F(self, z: np.ndarray) -> np.ndarray:\n",
        "        s = 1.0 / (1.0 + np.exp(-self.k_c * (z - self.theta_c)))\n",
        "        return (self.c_max * s).astype(np.float32)\n",
        "\n",
        "    def _Gamma(self, c: np.ndarray) -> np.ndarray:\n",
        "        s = 1.0 / (1.0 + np.exp(-self.k_g * (c - self.theta_g)))\n",
        "        return s.astype(np.float32)\n",
        "\n",
        "    # -------------------- one simulation step --------------------\n",
        "    def _step(self, u_t: np.ndarray):\n",
        "        \"\"\"\n",
        "        One NA-LESN step with input u_t (shape [d_in]).\n",
        "        Cross-couplings use one-step delays:\n",
        "          x_t uses g_{t-1}; c_t uses x_{t-1}; g_t uses c_{t-1}.\n",
        "        \"\"\"\n",
        "        x_prev = self.x\n",
        "        c_prev = self.c\n",
        "        g_prev = self.g\n",
        "\n",
        "        # --- neurons (tanh with leak and bias)\n",
        "        pre = (self.W_r @ x_prev) + (self.W_in @ u_t) + (self.B_g @ g_prev) + self.b\n",
        "        x_new = (1.0 - self.lam) * x_prev + self.lam * np.tanh(pre).astype(np.float32)\n",
        "\n",
        "        # --- glutamate proxy and pooling (uses x_{t-1})\n",
        "        q = np.maximum(self.W_rel @ x_prev, 0.0).astype(np.float32)     # ReLU\n",
        "        drive = (self.H @ q).astype(np.float32)\n",
        "\n",
        "        # --- astro Ca²⁺ with 5-point stencil Laplacian\n",
        "        Fc = self._F(drive)\n",
        "        Lc_prev = self._laplacian_apply(c_prev)\n",
        "        c_new = (1.0 - self.alpha) * c_prev + self.alpha * (Fc + self.D * Lc_prev + self.zeta_scalar)\n",
        "\n",
        "        # --- gliotransmitter (uses c_{t-1})\n",
        "        if self.g_mode == \"linear\":\n",
        "            g_target = self._Gamma(c_prev)\n",
        "            g_new = (1.0 - self.rho) * g_prev + self.rho * g_target\n",
        "        else:  # depletion\n",
        "            g_prod = self._Gamma(c_prev)\n",
        "            g_new = g_prev + self.rho * (g_prod * (1.0 - g_prev) - self.delta_g * g_prev)\n",
        "        g_new = np.clip(g_new, 0.0, 1.0).astype(np.float32)\n",
        "\n",
        "        self.x, self.c, self.g = x_new, c_new.astype(np.float32), g_new\n",
        "\n",
        "    # -------------------- features --------------------\n",
        "    def _features_from_state(self) -> np.ndarray:\n",
        "        if self.feature_mode == \"x\":\n",
        "            feat = self.x\n",
        "        elif self.feature_mode == \"x_c_g\":\n",
        "            feat = np.concatenate([self.x, self.c, self.g], axis=0)\n",
        "        else:  # 'x_x2_g': [x ; x^2 ; g]\n",
        "            feat = np.concatenate([self.x, self.x * self.x, self.g], axis=0)\n",
        "\n",
        "        # Optional polynomial lift (except when we already added x^2 explicitly)\n",
        "        if self.use_poly and self.feature_mode != \"x_x2_g\":\n",
        "            feat = np.concatenate([feat, feat * feat], axis=0)\n",
        "\n",
        "        # Always append constant for intercept\n",
        "        feat = np.concatenate([feat, [1.0]], axis=0)\n",
        "        return feat.astype(np.float32)\n",
        "\n",
        "    # -------------------- API: reset / train / predict --------------------\n",
        "    def reset_state(self):\n",
        "        self.x.fill(0.0)\n",
        "        self.c.fill(0.0)\n",
        "        self.g.fill(0.0)\n",
        "\n",
        "    def fit_readout(self, inputs: np.ndarray, targets: np.ndarray, discard: int = 100):\n",
        "        \"\"\"\n",
        "        Teacher-forced ridge regression for the read-out.\n",
        "        inputs  : [T, d_in]\n",
        "        targets : [T, d_out]\n",
        "        \"\"\"\n",
        "        inputs = np.asarray(inputs, dtype=np.float32)\n",
        "        targets = np.asarray(targets, dtype=np.float32)\n",
        "        T, d_in = inputs.shape\n",
        "        if d_in != self.d_in:\n",
        "            raise ValueError(\"input_dim mismatch\")\n",
        "        if T <= discard:\n",
        "            raise ValueError(\"sequence too short for discard period\")\n",
        "\n",
        "        #self.reset_state()\n",
        "        feats = []\n",
        "        for t in range(T):\n",
        "            self._step(inputs[t])\n",
        "            if t >= discard:\n",
        "                feats.append(self._features_from_state())\n",
        "        X = np.asarray(feats, dtype=np.float32)     # [T-d, F]\n",
        "        Y = targets[discard:]                       # [T-d, d_out]\n",
        "\n",
        "        reg = Ridge(alpha=self.ridge_alpha, fit_intercept=False)\n",
        "        reg.fit(X, Y)\n",
        "        self.W_out = reg.coef_.astype(np.float32)\n",
        "\n",
        "    def predict_autoregressive(self, init_input: np.ndarray, n_steps: int) -> np.ndarray:\n",
        "        \"\"\"\n",
        "        Closed-loop prediction (feedback first d_in outputs).\n",
        "        \"\"\"\n",
        "        if self.W_out is None:\n",
        "            raise RuntimeError(\"Call fit_readout() before prediction\")\n",
        "        d_out = self.W_out.shape[0]\n",
        "        preds = np.empty((n_steps, d_out), dtype=np.float32)\n",
        "\n",
        "        #self.reset_state()\n",
        "        current_u = np.asarray(init_input, dtype=np.float32).copy()\n",
        "        for t in range(n_steps):\n",
        "            self._step(current_u)\n",
        "            feat = self._features_from_state()\n",
        "            y_t = (self.W_out @ feat).astype(np.float32)\n",
        "            preds[t] = y_t\n",
        "            current_u = y_t[: self.d_in]\n",
        "        return preds\n",
        "\n",
        "    def predict_open_loop(self, test_input: np.ndarray) -> np.ndarray:\n",
        "        \"\"\"\n",
        "        Open-loop (teacher-forced) prediction over a provided input sequence.\n",
        "        test_input : [T, d_in] → returns [T, d_out]\n",
        "        \"\"\"\n",
        "        if self.W_out is None:\n",
        "            raise RuntimeError(\"Call fit_readout() before prediction\")\n",
        "        test_input = np.asarray(test_input, dtype=np.float32)\n",
        "        if test_input.ndim != 2 or test_input.shape[1] != self.d_in:\n",
        "            raise ValueError(f\"test_input must have shape [T, {self.d_in}]\")\n",
        "\n",
        "        T = test_input.shape[0]\n",
        "        d_out = self.W_out.shape[0]\n",
        "        preds = np.empty((T, d_out), dtype=np.float32)\n",
        "\n",
        "        #self.reset_state()\n",
        "        for t in range(T):\n",
        "            self._step(test_input[t])\n",
        "            feat = self._features_from_state()\n",
        "            preds[t] = (self.W_out @ feat).astype(np.float32)\n",
        "        return preds\n",
        "\n",
        "    # -------------------- quick ESP checks (optional) --------------------\n",
        "    def estimate_row_bounds(self, iters: int = 50, rng=None):\n",
        "        \"\"\"\n",
        "        Rough estimates for the three row sums in the ESP certificate:\n",
        "          neuron_row ≈ (1−λ) + λ ( ||W_r|| + ||B_g|| )\n",
        "          ca_row     ≈ (1−α) + α ( D ||L|| + L_F ||H W_rel|| )\n",
        "          glio_row   ≈ (1−ρ) + ρ L_Γ  (or ≤ 1 − ρδ + ρ L_Γ for depletion)\n",
        "        \"\"\"\n",
        "        if rng is None:\n",
        "            rng = np.random.default_rng(self.seed + 7)\n",
        "\n",
        "        nWr = self._opnorm_matrix(self.W_r, iters=iters, rng=rng)\n",
        "        nBg = self._opnorm_matrix(self.B_g, iters=iters, rng=rng)\n",
        "\n",
        "        def apply_A(x):   return (self.H @ (self.W_rel @ x)).astype(np.float32)\n",
        "        def apply_AT(y):  return (self.W_rel.T @ (self.H.T @ y)).astype(np.float32)\n",
        "        nHW = self._opnorm_rect(apply_A, apply_AT, n_in=self.N, iters=iters, rng=rng)\n",
        "\n",
        "        def opnorm_L():\n",
        "            v = rng.standard_normal(self.M).astype(np.float32)\n",
        "            v /= (np.linalg.norm(v) + 1e-8)\n",
        "            for _ in range(iters):\n",
        "                w = self._laplacian_apply(v)\n",
        "                nw = float(np.linalg.norm(w) + 1e-12)\n",
        "                if nw == 0.0:\n",
        "                    break\n",
        "                v = (w / nw).astype(np.float32)\n",
        "            return float(np.linalg.norm(self._laplacian_apply(v)) + 1e-12)\n",
        "        nL = opnorm_L()\n",
        "\n",
        "        L_F = (self.k_c * self.c_max) / 4.0\n",
        "        L_G = (self.k_g) / 4.0\n",
        "\n",
        "        neuron_row = (1.0 - self.lam) + self.lam * (nWr + nBg)\n",
        "        ca_row     = (1.0 - self.alpha) + self.alpha * (self.D * nL + L_F * nHW)\n",
        "        glio_row   = (1.0 - self.rho) + self.rho * L_G if self.g_mode == \"linear\" \\\n",
        "                     else (1.0 - self.rho * self.delta_g) + self.rho * L_G\n",
        "\n",
        "        return dict(neuron_row=neuron_row, ca_row=ca_row, glio_row=glio_row)\n"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "20030a3f",
      "metadata": {
        "id": "20030a3f"
      },
      "source": [
        "# Datasets"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "aaba2430",
      "metadata": {
        "id": "aaba2430"
      },
      "source": [
        "### Lorenz System Data Generation"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "cd0e7586",
      "metadata": {
        "id": "cd0e7586"
      },
      "outputs": [],
      "source": [
        "def lorenz_derivatives(state, t, sigma=10.0, rho=28.0, beta=8.0/3.0):\n",
        "    \"\"\"Compute time derivatives [dx/dt, dy/dt, dz/dt] for the Lorenz system.\"\"\"\n",
        "    x, y, z = state\n",
        "    dxdt = sigma * (y - x)\n",
        "    dydt = x * (rho - z) - y\n",
        "    dzdt = x * y - beta * z\n",
        "    return [dxdt, dydt, dzdt]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "7c35a92e",
      "metadata": {
        "id": "7c35a92e"
      },
      "outputs": [],
      "source": [
        "def generate_lorenz_data(\n",
        "    initial_state=[1.0, 1.0, 1.0],\n",
        "    tmax=25.0,\n",
        "    dt=0.01,\n",
        "    sigma=10.0,\n",
        "    rho=28.0,\n",
        "    beta=8.0/3.0\n",
        "):\n",
        "    \"\"\"\n",
        "    Numerically integrate Lorenz equations x'(t), y'(t), z'(t) using odeint.\n",
        "    Returns:\n",
        "       t_vals: array of time points\n",
        "       sol   : array shape [num_steps, 3] of [x(t), y(t), z(t)]\n",
        "    \"\"\"\n",
        "    num_steps = int(tmax / dt)\n",
        "    t_vals = np.linspace(0, tmax, num_steps)\n",
        "    sol = odeint(lorenz_derivatives, initial_state, t_vals, args=(sigma, rho, beta))\n",
        "    return t_vals, sol"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "50325aa7",
      "metadata": {
        "id": "50325aa7"
      },
      "source": [
        "### Rossler System Data Generation"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "6e24b363",
      "metadata": {
        "id": "6e24b363"
      },
      "outputs": [],
      "source": [
        "def rossler_derivatives(state, t, a=0.2, b=0.2, c=5.7):\n",
        "    \"\"\"Compute time derivatives [dx/dt, dy/dt, dz/dt] for the Rössler system.\"\"\"\n",
        "    x, y, z = state\n",
        "    dxdt = -y - z\n",
        "    dydt = x + a * y\n",
        "    dzdt = b + z * (x - c)\n",
        "    return [dxdt, dydt, dzdt]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "e71b9eb9",
      "metadata": {
        "id": "e71b9eb9"
      },
      "outputs": [],
      "source": [
        "def generate_rossler_data(\n",
        "    initial_state=[1.0, 0.0, 0.0],\n",
        "    tmax=25.0,\n",
        "    dt=0.01,\n",
        "    a=0.2,\n",
        "    b=0.2,\n",
        "    c=5.7\n",
        "):\n",
        "    \"\"\"\n",
        "    Numerically integrate Rössler equations x'(t), y'(t), z'(t) using odeint.\n",
        "    Returns:\n",
        "       t_vals: array of time points\n",
        "       sol   : array shape [num_steps, 3] of [x(t), y(t), z(t)]\n",
        "    \"\"\"\n",
        "    num_steps = int(tmax / dt)\n",
        "    t_vals = np.linspace(0, tmax, num_steps)\n",
        "    sol = odeint(rossler_derivatives, initial_state, t_vals, args=(a, b, c))\n",
        "    return t_vals, sol"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "8fe02d06",
      "metadata": {
        "id": "8fe02d06"
      },
      "source": [
        "### Chen System Data Generation"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "a646dd5f",
      "metadata": {
        "id": "a646dd5f"
      },
      "outputs": [],
      "source": [
        "def chen_derivatives(state, t, a=35.0, b=3.0, c=28.0):\n",
        "    \"\"\"\n",
        "    Computes time derivatives [dx/dt, dy/dt, dz/dt] for the Chen system.\n",
        "    \"\"\"\n",
        "    x, y, z = state\n",
        "    dxdt = a*(y - x)\n",
        "    dydt = (c - a)*x + c*y - x*z\n",
        "    dzdt = x*y - b*z\n",
        "    return [dxdt, dydt, dzdt]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "42733740",
      "metadata": {
        "id": "42733740"
      },
      "outputs": [],
      "source": [
        "def generate_chen_data(\n",
        "    initial_state=[1.0, 1.0, 1.0],\n",
        "    tmax=50.0,\n",
        "    dt=0.01,\n",
        "    a=35.0,\n",
        "    b=3.0,\n",
        "    c=28.0\n",
        "):\n",
        "    \"\"\"\n",
        "    Numerically integrate Chen equations x'(t), y'(t), z'(t) using odeint.\n",
        "    Returns:\n",
        "       t_vals: array of time points\n",
        "       sol   : array shape [num_steps, 3] of [x(t), y(t), z(t)]\n",
        "    \"\"\"\n",
        "    num_steps = int(tmax / dt)\n",
        "    t_vals = np.linspace(0, tmax, num_steps)\n",
        "    sol = odeint(chen_derivatives, initial_state, t_vals, args=(a, b, c))\n",
        "    return t_vals, sol"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "2a3f44de",
      "metadata": {
        "id": "2a3f44de"
      },
      "source": [
        "# Metrics"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "587f6038",
      "metadata": {
        "id": "587f6038"
      },
      "source": [
        "### NRMSE"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "b55e0383",
      "metadata": {
        "id": "b55e0383"
      },
      "outputs": [],
      "source": [
        "def evaluate_nrmse(all_preds, test_target, horizons):\n",
        "    \"\"\"\n",
        "    Evaluate model performance over multiple prediction horizons\n",
        "    for teacher-forced single-step forecasting or autoregressive rollout.\n",
        "    \"\"\"\n",
        "    horizon_nrmse = {}\n",
        "    for horizon in horizons:\n",
        "        preds = all_preds[:horizon]\n",
        "        targets = test_target[:horizon]\n",
        "        squared_errors = (preds - targets) ** 2\n",
        "        variance = np.var(targets, axis=0)\n",
        "        variance[variance == 0] = 1e-8  # avoid divide-by-zero\n",
        "        nrmse = np.sqrt(np.sum(squared_errors) / (horizon * np.sum(variance)))\n",
        "        horizon_nrmse[horizon] = nrmse\n",
        "    return horizon_nrmse"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "feb9a21c",
      "metadata": {
        "id": "feb9a21c"
      },
      "source": [
        "### Dimensionless Predictive Horizon"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "193a03f4",
      "metadata": {
        "id": "193a03f4"
      },
      "outputs": [],
      "source": [
        "def compute_valid_prediction_time(y_true, y_pred, t_vals, lyupanov_time, threshold, dt=0.2):\n",
        "    \"\"\"\n",
        "    Compute the Valid Prediction Time (VPT) and compare it to Lyapunov time.\n",
        "\n",
        "    Parameters\n",
        "    ----------\n",
        "    y_true : ndarray of shape (N, dim)\n",
        "        True trajectory over time.\n",
        "    y_pred : ndarray of shape (N, dim)\n",
        "        Model's predicted trajectory over time (closed-loop).\n",
        "    t_vals : ndarray of shape (N,)\n",
        "        Time values corresponding to the trajectory steps.\n",
        "    threshold : float\n",
        "        The error threshold, default is 0.4 as in your snippet.\n",
        "    lyupanov_time : float\n",
        "        1/Largest Lyapunov exponent.\n",
        "\n",
        "    Returns\n",
        "    -------\n",
        "    T_VPT : float\n",
        "        Valid prediction time. The earliest time at which normalized error surpasses threshold\n",
        "        (or the last time if never surpassed).\n",
        "    ratio : float\n",
        "        How many Lyapunov times the model prediction remains valid, i.e. T_VPT / T_lambda.\n",
        "    \"\"\"\n",
        "    # Average of y_true\n",
        "    y_mean = np.mean(y_true, axis=0)  # shape (dim,)\n",
        "\n",
        "    #  Time-averaged norm^2 of (y_true - y_mean)\n",
        "    y_centered = y_true - y_mean\n",
        "    denom = np.mean(np.sum(y_centered**2, axis=1))  # scalar\n",
        "\n",
        "    # Compute the normalized error delta_gamma(t) = ||y_true - y_pred||^2 / denom\n",
        "    diff = y_true - y_pred\n",
        "    err_sq = np.sum(diff**2, axis=1)  # shape (N,)\n",
        "    delta_gamma = err_sq / denom      # shape (N,)\n",
        "\n",
        "    #  Find the first time index where delta_gamma(t) exceeds threshold\n",
        "    idx_exceed = np.where(delta_gamma > threshold)[0]\n",
        "    if len(idx_exceed) == 0:\n",
        "        # never exceeds threshold => set T_VPT to the final time\n",
        "        T_VPT = t_vals[-1]\n",
        "    else:\n",
        "        T_VPT = t_vals[idx_exceed[0]]\n",
        "\n",
        "    # Compute T_lambda and ratio\n",
        "    T_lambda = lyupanov_time\n",
        "\n",
        "    # print(f\"\\n--- Valid Prediction Time (VPT) with threshold={threshold}, lambda_max={lambda_max} ---\")\n",
        "\n",
        "    T_VPT = (T_VPT - t_vals[0])  # Adjust T_VPT to be relative to the start time\n",
        "    ratio = T_VPT / T_lambda\n",
        "\n",
        "    return T_VPT, ratio"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "5e4e8e78",
      "metadata": {
        "id": "5e4e8e78"
      },
      "source": [
        "### Attractor Geometry Deviation"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "38f84534",
      "metadata": {
        "id": "38f84534"
      },
      "outputs": [],
      "source": [
        "def compute_attractor_deviation(predictions, targets, cube_size=(0.1, 0.1, 0.1)):\n",
        "    \"\"\"\n",
        "    Compute the Attractor Deviation (ADev) metric.\n",
        "\n",
        "    Parameters:\n",
        "        predictions (numpy.ndarray): Predicted trajectories of shape (n, 3).\n",
        "        targets (numpy.ndarray): True trajectories of shape (n, 3).\n",
        "        cube_size (tuple): Dimensions of the cube (dx, dy, dz).\n",
        "\n",
        "    Returns:\n",
        "        float: The ADev metric.\n",
        "    \"\"\"\n",
        "    # Define the cube grid based on the range of the data and cube size\n",
        "    min_coords = np.min(np.vstack((predictions, targets)), axis=0)\n",
        "    max_coords = np.max(np.vstack((predictions, targets)), axis=0)\n",
        "\n",
        "    # Create a grid of cubes\n",
        "    grid_shape = ((max_coords - min_coords) / cube_size).astype(int) + 1\n",
        "\n",
        "    # Initialize the cube occupancy arrays\n",
        "    pred_cubes = np.zeros(grid_shape, dtype=int)\n",
        "    target_cubes = np.zeros(grid_shape, dtype=int)\n",
        "\n",
        "    # Map trajectories to cubes\n",
        "    pred_indices = ((predictions - min_coords) / cube_size).astype(int)\n",
        "    target_indices = ((targets - min_coords) / cube_size).astype(int)\n",
        "\n",
        "    # Mark cubes visited by predictions and targets\n",
        "    for idx in pred_indices:\n",
        "        pred_cubes[tuple(idx)] = 1\n",
        "    for idx in target_indices:\n",
        "        target_cubes[tuple(idx)] = 1\n",
        "\n",
        "    # Compute the ADev metric\n",
        "    adev = np.sum(np.abs(pred_cubes - target_cubes))\n",
        "    return adev"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "825c2de7",
      "metadata": {
        "id": "825c2de7"
      },
      "source": [
        "### PSD"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "402a5c32",
      "metadata": {
        "id": "402a5c32"
      },
      "outputs": [],
      "source": [
        "def compute_psd(y, dt=0.01):\n",
        "    z = y[:, 2]  # Extract Z-component\n",
        "\n",
        "    # Compute PSD using Welch’s method\n",
        "    freqs, psd = welch(z, fs=1/dt, window='hamming', nperseg=len(z))  # Using Hamming window\n",
        "\n",
        "    return freqs, psd"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "bfe5b4c4",
      "metadata": {
        "id": "bfe5b4c4"
      },
      "source": [
        "# Dataset Preparation"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "627c7a40",
      "metadata": {
        "id": "627c7a40"
      },
      "source": [
        "### Lorenz System"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "d7b1b30f",
      "metadata": {
        "id": "d7b1b30f"
      },
      "outputs": [],
      "source": [
        "tmax = 250.0\n",
        "dt = 0.02\n",
        "lorenz_t_vals, lorenz_trajectory = generate_lorenz_data(\n",
        "    initial_state=[1.0, 1.0, 1.0],\n",
        "    tmax=tmax,\n",
        "    dt=dt,\n",
        "    sigma=10.0,\n",
        "    rho=28.0,\n",
        "    beta=8.0/3.0\n",
        ")\n",
        "\n",
        "# Discard first 2,000 points as washout\n",
        "washout = 2000\n",
        "lorenz_t_vals = lorenz_t_vals[washout:]\n",
        "lorenz_trajectory = lorenz_trajectory[washout:]\n",
        "\n",
        "scaler = MinMaxScaler()\n",
        "scaler.fit(lorenz_trajectory)\n",
        "lorenz_traj = scaler.transform(lorenz_trajectory)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "8396e37d",
      "metadata": {},
      "outputs": [],
      "source": [
        "fig = plt.figure(figsize=(10, 5))\n",
        "ax = fig.add_subplot(projection='3d')\n",
        "\n",
        "colors = cm.twilight(np.linspace(0, 1, len(lorenz_trajectory)))\n",
        "\n",
        "for i in range(len(lorenz_trajectory) - 1):\n",
        "    ax.plot(lorenz_trajectory[i:i+2, 0], lorenz_trajectory[i:i+2, 1], lorenz_trajectory[i:i+2, 2],\n",
        "            color=colors[i], linewidth=1.2, alpha=0.9)\n",
        "\n",
        "ax.grid(True)\n",
        "\n",
        "ax.tick_params(axis='x', colors='none')\n",
        "ax.tick_params(axis='y', colors='none')\n",
        "ax.tick_params(axis='z', colors='none')\n",
        "plt.savefig(\"Figures/Lorenz Attractor.png\", dpi=400, bbox_inches='tight')\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "41c79970",
      "metadata": {},
      "outputs": [],
      "source": [
        "sns.set(style=\"whitegrid\")\n",
        "\n",
        "t = np.linspace(0, len(lorenz_trajectory), len(lorenz_trajectory))\n",
        "\n",
        "fig, axes = plt.subplots(3, 1, figsize=(14, 10), sharex=True)\n",
        "\n",
        "dims = ['x(t)', 'y(t)', 'z(t)']\n",
        "line_labels = ['True', 'TRIGR']\n",
        "line_styles = ['--', '-']\n",
        "line_colors = ['#2c3e94', '#e25822']\n",
        "\n",
        "for i in range(3):\n",
        "    axes[i].plot(t, lorenz_trajectory[:, i], label=line_labels[0], linewidth=2.5, color=line_colors[0])\n",
        "    axes[i].set_ylabel(dims[i], fontsize=13)\n",
        "    # Hide tick labels (units) on x and y axes\n",
        "    axes[i].set_xticklabels([])\n",
        "    axes[i].set_yticklabels([])\n",
        "\n",
        "    # keep tick marks but adjust size if needed\n",
        "    axes[i].tick_params(axis='both', which='major', labelsize=0)\n",
        "\n",
        "    axes[i].grid(True, linestyle='--', linewidth=0.6, alpha=0.3)  \n",
        "\n",
        "plt.tight_layout(rect=[0, 0.03, 1, 0.95])\n",
        "plt.savefig(\"Figures/Trajectories for Train Segment.png\", dpi=400, bbox_inches='tight')\n",
        "plt.show()\n"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "9bcffe6c",
      "metadata": {
        "id": "9bcffe6c"
      },
      "outputs": [],
      "source": [
        "# Prepare single-step data: input(t) = [x(t), y(t), z(t)], target(t)=[x(t+1), y(t+1), z(t+1)]\n",
        "inputs = lorenz_trajectory[:-1]\n",
        "targets = lorenz_trajectory[1:]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "cc0988de",
      "metadata": {},
      "outputs": [],
      "source": [
        "train_frac = 0.7\n",
        "data_size = len(lorenz_trajectory)-1\n",
        "train_size = int(train_frac * (data_size - 1))\n",
        "train_input = inputs[:train_size]\n",
        "train_target = targets[1:train_size+1]\n",
        "test_input = inputs[train_size:-1]\n",
        "test_target = targets[train_size+1:]\n",
        "test_size = len(test_input)\n",
        "print(f\"Total samples: {data_size}, train size: {train_size}, test size: {test_size}\")"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "2f5f95aa",
      "metadata": {
        "id": "2f5f95aa"
      },
      "source": [
        "### Rossler System"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "51b8c9a4",
      "metadata": {
        "id": "51b8c9a4"
      },
      "outputs": [],
      "source": [
        "tmax = 250.0\n",
        "dt = 0.02\n",
        "rossler_t_vals, rossler_trajectory = generate_rossler_data(\n",
        "    initial_state=[1.0, 0.0, 0.0],\n",
        "    tmax=tmax,\n",
        "    dt=dt,\n",
        "    a=0.2,\n",
        "    b=0.2,\n",
        "    c=5.7\n",
        ")\n",
        "\n",
        "# Discard first 2,000 points as washout\n",
        "washout = 2000\n",
        "rossler_t_vals = rossler_t_vals[washout:]\n",
        "rossler_trajectory = rossler_trajectory[washout:]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "3662744c",
      "metadata": {},
      "outputs": [],
      "source": [
        "fig = plt.figure(figsize=(10, 5))\n",
        "ax = fig.add_subplot(projection='3d')\n",
        "\n",
        "colors = cm.twilight(np.linspace(0, 1, len(rossler_trajectory)))\n",
        "\n",
        "for i in range(len(rossler_trajectory) - 1):\n",
        "    ax.plot(rossler_trajectory[i:i+2, 0], rossler_trajectory[i:i+2, 1], rossler_trajectory[i:i+2, 2],\n",
        "            color=colors[i], linewidth=1.2, alpha=0.9)\n",
        "\n",
        "ax.grid(True)\n",
        "\n",
        "ax.tick_params(axis='x', colors='none')\n",
        "ax.tick_params(axis='y', colors='none')\n",
        "ax.tick_params(axis='z', colors='none')\n",
        "\n",
        "plt.savefig(\"Figures/Rossler Attractor.png\", dpi=400, bbox_inches='tight')\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "a00176e8",
      "metadata": {},
      "outputs": [],
      "source": [
        "t = np.linspace(0, len(rossler_trajectory), len(rossler_trajectory))\n",
        "\n",
        "plt.figure(figsize=(10, 5))\n",
        "plt.plot(t, rossler_trajectory[:, 0], label='x(t)', color='r', lw=0.8)\n",
        "plt.plot(t, rossler_trajectory[:, 1], label='y(t)', color='g', lw=0.8)\n",
        "plt.plot(t, rossler_trajectory[:, 2], label='z(t)', color='b', lw=0.8)\n",
        "\n",
        "plt.title(\"Time Series of Rossler System\")\n",
        "plt.legend()\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "df5c4db1",
      "metadata": {
        "id": "df5c4db1"
      },
      "outputs": [],
      "source": [
        "# Prepare single-step data: input(t) = [x(t), y(t), z(t)], target(t)=[x(t+1), y(t+1), z(t+1)]\n",
        "inputs = rossler_trajectory[:-1]\n",
        "targets = rossler_trajectory[1:]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "175ae0d4",
      "metadata": {},
      "outputs": [],
      "source": [
        "train_frac = 0.3\n",
        "data_size = len(rossler_trajectory)-1\n",
        "train_size = int(train_frac * (data_size - 1))\n",
        "train_input = inputs[:train_size]\n",
        "train_target = targets[1:train_size+1]\n",
        "test_input = inputs[train_size:-1]\n",
        "test_target = targets[train_size+1:]\n",
        "test_size = len(test_input)\n",
        "print(f\"Total samples: {data_size}, train size: {train_size}, test size: {test_size}\")"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "b0e48e4c",
      "metadata": {
        "id": "b0e48e4c"
      },
      "source": [
        "### Chen System"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "a885e570",
      "metadata": {
        "id": "a885e570"
      },
      "outputs": [],
      "source": [
        "tmax = 250.0\n",
        "dt = 0.02\n",
        "chen_t_vals, chen_trajectory = generate_chen_data(\n",
        "    initial_state=[1.0, 1.0, 1.0],\n",
        "    tmax=tmax,\n",
        "    dt=dt,\n",
        "    a=35.0,\n",
        "    b=3.0,\n",
        "    c=28.0\n",
        ")\n",
        "\n",
        "# Discard first 2,000 points as washout\n",
        "washout = 2000\n",
        "chen_t_vals = chen_t_vals[washout:]\n",
        "chen_trajectory = chen_trajectory[washout:]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "d5b04cf1",
      "metadata": {},
      "outputs": [],
      "source": [
        "fig = plt.figure(figsize=(10, 5))\n",
        "ax = fig.add_subplot(projection='3d')\n",
        "\n",
        "colors = cm.twilight_r(np.linspace(0, 1, len(chen_trajectory)))\n",
        "\n",
        "for i in range(len(chen_trajectory) - 1):\n",
        "    ax.plot(chen_trajectory[i:i+2, 0], chen_trajectory[i:i+2, 1], chen_trajectory[i:i+2, 2],\n",
        "            color=colors[i], linewidth=1.2, alpha=0.9)\n",
        "\n",
        "ax.grid(True)\n",
        "\n",
        "ax.tick_params(axis='x', colors='none')\n",
        "ax.tick_params(axis='y', colors='none')\n",
        "ax.tick_params(axis='z', colors='none')\n",
        "\n",
        "plt.savefig(\"Figures/Chen Attractor.png\", dpi=400, bbox_inches='tight')\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "861e2f64",
      "metadata": {},
      "outputs": [],
      "source": [
        "t = np.linspace(0, len(chen_trajectory), len(chen_trajectory))\n",
        "\n",
        "plt.figure(figsize=(10, 5))\n",
        "plt.plot(t, chen_trajectory[:, 0], label='x(t)', color='r', lw=0.8)\n",
        "plt.plot(t, chen_trajectory[:, 1], label='y(t)', color='g', lw=0.8)\n",
        "plt.plot(t, chen_trajectory[:, 2], label='z(t)', color='b', lw=0.8)\n",
        "\n",
        "plt.title(\"Time Series of Chen System\")\n",
        "plt.legend()\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "ed7798bd",
      "metadata": {
        "id": "ed7798bd"
      },
      "outputs": [],
      "source": [
        "# Prepare single-step data: input(t) = [x(t), y(t), z(t)], target(t)=[x(t+1), y(t+1), z(t+1)]\n",
        "inputs = chen_trajectory[:-1]\n",
        "targets = chen_trajectory[1:]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "07a5201e",
      "metadata": {},
      "outputs": [],
      "source": [
        "train_frac = 0.7\n",
        "data_size = len(chen_trajectory)-1\n",
        "train_size = int(train_frac * (data_size - 1))\n",
        "train_input = inputs[:train_size]\n",
        "train_target = targets[1:train_size+1]\n",
        "test_input = inputs[train_size:-1]\n",
        "test_target = targets[train_size+1:]\n",
        "test_size = len(test_input)\n",
        "print(f\"Total samples: {data_size}, train size: {train_size}, test size: {test_size}\")"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "7fdf9585",
      "metadata": {
        "id": "7fdf9585"
      },
      "source": [
        "# Teacher-forced Single-step Forecasting"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "88f820ac",
      "metadata": {
        "id": "88f820ac"
      },
      "source": [
        "### Models Initialization"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "f86e34f3",
      "metadata": {
        "id": "f86e34f3"
      },
      "outputs": [],
      "source": [
        "# Baseline ESN\n",
        "esn = ESN3D(\n",
        "    reservoir_size=300,\n",
        "    spectral_radius=0.92,\n",
        "    connectivity=0.2,\n",
        "    input_scale=0.6,\n",
        "    leaking_rate=0.5,\n",
        "    ridge_alpha=1e-6,\n",
        "    seed=1002\n",
        ")\n",
        "esn.fit_readout(train_input, train_target, discard=100)\n",
        "esn_preds = esn.predict_open_loop(test_input)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "9a78b6ff",
      "metadata": {
        "id": "9a78b6ff"
      },
      "outputs": [],
      "source": [
        "# Cycle Reservoir\n",
        "cycle_res = CR3D(\n",
        "    reservoir_size=300,\n",
        "    spectral_radius=0.98,\n",
        "    input_scale=0.8,\n",
        "    leaking_rate=0.8,\n",
        "    ridge_alpha=1e-6,\n",
        "    seed=1002\n",
        ")\n",
        "cycle_res.fit_readout(train_input, train_target, discard=100)\n",
        "cycle_res_preds = cycle_res.predict_open_loop(test_input)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "05d3a8ff",
      "metadata": {
        "id": "05d3a8ff"
      },
      "outputs": [],
      "source": [
        "crj = CRJ3D(\n",
        "    reservoir_size=300,\n",
        "    jump=20,\n",
        "    spectral_radius=0.98,\n",
        "    input_scale=0.7,\n",
        "    leaking_rate=0.5,\n",
        "    ridge_alpha=1e-6,\n",
        "    seed=1002\n",
        ")\n",
        "crj.fit_readout(train_input, train_target, discard=100)\n",
        "crj_preds = crj.predict_open_loop(test_input)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "9d572da5",
      "metadata": {
        "id": "9d572da5"
      },
      "outputs": [],
      "source": [
        "mci_esn = MCI3D(\n",
        "    reservoir_size=150,\n",
        "    cycle_weight=0.6,\n",
        "    connect_weight=0.6,\n",
        "    combine_factor=0.4,\n",
        "    input_scale=0.5,\n",
        "    leaking_rate=0.9,\n",
        "    ridge_alpha=1e-6,\n",
        "    seed=1002\n",
        ")\n",
        "mci_esn.fit_readout(train_input, train_target, discard=100)\n",
        "mci_esn_preds = mci_esn.predict_open_loop(test_input)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "2109bae2",
      "metadata": {
        "id": "2109bae2"
      },
      "outputs": [],
      "source": [
        "deepesn = DeepESN3D(\n",
        "    num_layers=3,\n",
        "    reservoir_size=100,\n",
        "    spectral_radius=0.95,\n",
        "    connectivity=0.05,\n",
        "    input_scale=0.8,\n",
        "    leaking_rate=0.3,\n",
        "    ridge_alpha=1e-6,\n",
        "    seed=1002\n",
        ")\n",
        "deepesn.fit_readout(train_input, train_target, discard=100)\n",
        "deepesn_preds = deepesn.predict_open_loop(test_input)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "47a034c5",
      "metadata": {
        "id": "47a034c5"
      },
      "outputs": [],
      "source": [
        "trigr = GliaNeuronTripartiteReservoirESN(\n",
        "    # sizes\n",
        "        reservoir_size=300,          # N\n",
        "        input_dim=3,\n",
        "        astro_nx=20,                 # grid width\n",
        "        astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "        rel_channels=128,            # P\n",
        "    \n",
        "        # kinetics / rates\n",
        "        leak_x=0.45,                 # λ\n",
        "        rate_c=0.05,                 # α\n",
        "        rate_g=0.05,                 # ρ\n",
        "        diff_D=0.5,                  # D (will be scaled safely)\n",
        "    \n",
        "        # neuron bias\n",
        "        bias=0.0,                    # scalar or length-N array\n",
        "    \n",
        "        # nonlinearities (F, Γ)\n",
        "        c_max=1.0,                   # max Ca\n",
        "        k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "        theta_c=0.0,                 # midpoint for F\n",
        "        k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "        theta_g=0.0,                 # midpoint for Γ\n",
        "        zeta=0.0,                    # tonic drive (scalar)\n",
        "        g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "        delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "    \n",
        "        # input map\n",
        "        input_scale=0.2,\n",
        "    \n",
        "        # randomization / sparsity\n",
        "        W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "        footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "        block_scale=1.0,             # base std for random blocks\n",
        "        eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "    \n",
        "        # spectral safety targets (row budgets, both < 1)\n",
        "        rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "        rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "    \n",
        "        # read-out\n",
        "        ridge_alpha=1e-6,\n",
        "        use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "        feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "    )\n",
        "trigr.fit_readout(train_input, train_target, discard=100)\n",
        "trigr_preds = trigr.predict_open_loop(test_input)"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "68591f02",
      "metadata": {
        "id": "68591f02"
      },
      "source": [
        "### NRMSE Report"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "eec6145f",
      "metadata": {
        "id": "eec6145f"
      },
      "outputs": [],
      "source": [
        "# Define horizons to test\n",
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [200, 400, 600, 800, 1000]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "601b147d",
      "metadata": {
        "id": "601b147d"
      },
      "outputs": [],
      "source": [
        "esn_nrmse = evaluate_nrmse(esn_preds, test_target, all_horizons)\n",
        "cycle_res_nrmse = evaluate_nrmse(cycle_res_preds, test_target, all_horizons)\n",
        "crj_nrmse = evaluate_nrmse(crj_preds, test_target, all_horizons)\n",
        "mci_esn_nrmse = evaluate_nrmse(mci_esn_preds, test_target, all_horizons)\n",
        "deepesn_nrmse = evaluate_nrmse(deepesn_preds, test_target, all_horizons)\n",
        "trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "0c55fe33",
      "metadata": {
        "id": "0c55fe33"
      },
      "outputs": [],
      "source": [
        "# Print results\n",
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'ESN':<15} {'SCR':<15} {'CRJ':<15} {'MCI-ESN':<15} {'DeepESN':<15} {'TRIGR':<15}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "for horizon in horizons:\n",
        "    print(f\"{horizon:<10} {np.mean(esn_nrmse[horizon]):<15.7f} {np.mean(cycle_res_nrmse[horizon]):<15.7f} {np.mean(crj_nrmse[horizon]):<15.7f} {np.mean(mci_esn_nrmse[horizon]):<15.7f} {np.mean(deepesn_nrmse[horizon]):<15.7f} {np.mean(trigr_nrmse[horizon]):<15.7f}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "719c161b",
      "metadata": {
        "id": "719c161b"
      },
      "outputs": [],
      "source": [
        "# Plot NRMSE vs Horizon\n",
        "plot_len=1000\n",
        "steps = list(range(10, plot_len+1, 10))\n",
        "\n",
        "plt.figure(figsize=(10, 6))\n",
        "plt.plot(steps, [np.mean(esn_nrmse[s]) for s in steps], label='ESN')\n",
        "plt.plot(steps, [np.mean(cycle_res_nrmse[s]) for s in steps], label='SCR')\n",
        "plt.plot(steps, [np.mean(crj_nrmse[s]) for s in steps], label='CRJ')\n",
        "plt.plot(steps, [np.mean(mci_esn_nrmse[s]) for s in steps], label='MCI-ESN')\n",
        "plt.plot(steps, [np.mean(deepesn_nrmse[s]) for s in steps], label='DeepESN')\n",
        "plt.plot(steps, [np.mean(trigr_nrmse[s]) for s in steps], label='TRIGR')\n",
        "plt.xlabel('Prediction Horizon')\n",
        "plt.ylabel('NRMSE')\n",
        "plt.title('NRMSE vs. Prediction Horizon (Teacher-forced Single Step Forecasting)')\n",
        "plt.legend()\n",
        "plt.savefig(\"Figures/NRMSE vs. Prediction Horizon (Teacher-forced Single Step Forecasting).png\", dpi=400, bbox_inches='tight')\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "f23256b6",
      "metadata": {
        "id": "f23256b6"
      },
      "source": [
        "### Trajectory Plots"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "011573c4",
      "metadata": {
        "id": "011573c4"
      },
      "outputs": [],
      "source": [
        "plot_len = 999\n",
        "steps = list(range(1, plot_len+1))\n",
        "\n",
        "# Create subplots for x, y, z dimensions\n",
        "fig, axes = plt.subplots(3, 1, figsize=(12, 12))\n",
        "\n",
        "dims = ['x(t)', 'y(t)', 'z(t)']\n",
        "for i in range(3):\n",
        "    axes[i].plot(steps, test_target[:plot_len, i], label='True', linestyle='dashed')\n",
        "    # axes[i].plot(steps, esn_preds[:plot_len, i], label='ESN')\n",
        "    # axes[i].plot(steps, cycle_res_preds[:plot_len, i], label='CycleRes')\n",
        "    axes[i].plot(steps, trigr_preds[:plot_len, i], label='TRIGR')\n",
        "    axes[i].set_ylabel(dims[i])\n",
        "    axes[i].legend()\n",
        "\n",
        "axes[-1].set_xlabel('Time Step')\n",
        "fig.suptitle('Predicted Trajectories for Test Segment (Teacher-forced Single Step Forecasting)', fontsize=16)\n",
        "plt.tight_layout()\n",
        "plt.savefig(\"Figures/Predicted Trajectories for Test Segment (Teacher-forced Single Step Forecasting).png\", dpi=400, bbox_inches='tight')\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "4b7b8819",
      "metadata": {
        "id": "4b7b8819"
      },
      "outputs": [],
      "source": [
        "fig = plt.figure(figsize=(9, 9))\n",
        "ax = fig.add_subplot(projection='3d')\n",
        "ax.plot(test_target[:plot_len,0], test_target[:plot_len,1], test_target[:plot_len,2], label='True', linestyle='dashed')\n",
        "ax.plot(trigr_preds[:plot_len,0], trigr_preds[:plot_len,1], trigr_preds[:plot_len,2], label='TRIGR')\n",
        "ax.set_title('Lorenz Phase Space Plot for Test Segment (Teacher-forced Single Step Forecasting)')\n",
        "\n",
        "ax.set_xlabel('X')\n",
        "ax.set_ylabel('Y')\n",
        "ax.set_zlabel('Z')\n",
        "\n",
        "ax.legend()\n",
        "plt.savefig(\"Figures/Lorenz Phase Space Plot for Test Segment (Teacher-forced Single Step Forecasting).png\", dpi=400, bbox_inches='tight')\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "49c6b1e1",
      "metadata": {
        "id": "49c6b1e1"
      },
      "source": [
        "# Autoregressive Forecasting"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "cc088a7c",
      "metadata": {
        "id": "cc088a7c"
      },
      "outputs": [],
      "source": [
        "initial_input = test_input[0]\n",
        "num_steps = len(test_input)"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "daa3be57",
      "metadata": {
        "id": "daa3be57"
      },
      "source": [
        "### Models Initialization"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "963e69e6",
      "metadata": {
        "id": "963e69e6"
      },
      "outputs": [],
      "source": [
        "# Baseline ESN\n",
        "esn = ESN3D(\n",
        "    reservoir_size=300,\n",
        "    spectral_radius=0.92,\n",
        "    connectivity=0.2,\n",
        "    input_scale=0.6,\n",
        "    leaking_rate=0.9,\n",
        "    ridge_alpha=1e-6,\n",
        "    seed=1002\n",
        ")\n",
        "esn.fit_readout(train_input, train_target, discard=100)\n",
        "esn_preds = esn.predict_autoregressive(initial_input, num_steps)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "9ee16356",
      "metadata": {
        "id": "9ee16356"
      },
      "outputs": [],
      "source": [
        "# Cycle Reservoir\n",
        "cycle_res = CR3D(\n",
        "    reservoir_size=300,\n",
        "    spectral_radius=0.98,\n",
        "    input_scale=0.8,\n",
        "    leaking_rate=0.8,\n",
        "    ridge_alpha=1e-6,\n",
        "    seed=1002\n",
        ")\n",
        "cycle_res.fit_readout(train_input, train_target, discard=100)\n",
        "cycle_res_preds = cycle_res.predict_autoregressive(initial_input, num_steps)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "2fb5d3ad",
      "metadata": {
        "id": "2fb5d3ad"
      },
      "outputs": [],
      "source": [
        "crj = CRJ3D(\n",
        "    reservoir_size=300,\n",
        "    jump=20,\n",
        "    spectral_radius=0.98,\n",
        "    input_scale=0.7,\n",
        "    leaking_rate=0.5,\n",
        "    ridge_alpha=1e-6,\n",
        "    seed=1002\n",
        ")\n",
        "crj.fit_readout(train_input, train_target, discard=100)\n",
        "crj_preds = crj.predict_autoregressive(initial_input, num_steps)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "41ead3cd",
      "metadata": {
        "id": "41ead3cd"
      },
      "outputs": [],
      "source": [
        "mci_esn = MCI3D(\n",
        "    reservoir_size=150,\n",
        "    cycle_weight=0.6,\n",
        "    connect_weight=0.6,\n",
        "    combine_factor=0.4,\n",
        "    input_scale=0.5,\n",
        "    leaking_rate=0.9,\n",
        "    ridge_alpha=1e-6,\n",
        "    seed=1002\n",
        ")\n",
        "mci_esn.fit_readout(train_input, train_target, discard=100)\n",
        "mci_esn_preds = mci_esn.predict_autoregressive(initial_input, num_steps)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "20c6352f",
      "metadata": {
        "id": "20c6352f"
      },
      "outputs": [],
      "source": [
        "deepesn = DeepESN3D(\n",
        "    num_layers=3,\n",
        "    reservoir_size=100,\n",
        "    spectral_radius=0.95,\n",
        "    connectivity=0.05,\n",
        "    input_scale=0.8,\n",
        "    leaking_rate=0.3,\n",
        "    ridge_alpha=1e-6,\n",
        "    seed=1002\n",
        ")\n",
        "deepesn.fit_readout(train_input, train_target, discard=100)\n",
        "deepesn_preds = deepesn.predict_autoregressive(initial_input, num_steps)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "a64e256e",
      "metadata": {
        "id": "a64e256e"
      },
      "outputs": [],
      "source": [
        "trigr = GliaNeuronTripartiteReservoirESN(\n",
        "    # sizes\n",
        "    reservoir_size=300,          # N\n",
        "    input_dim=3,\n",
        "    astro_nx=20,                 # grid width\n",
        "    astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "    rel_channels=128,            # P\n",
        "\n",
        "    # kinetics / rates\n",
        "    leak_x=0.45,                 # λ\n",
        "    rate_c=0.05,                 # α\n",
        "    rate_g=0.05,                 # ρ\n",
        "    diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "    # neuron bias\n",
        "    bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "    # nonlinearities (F, Γ)\n",
        "    c_max=1.0,                   # max Ca\n",
        "    k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "    theta_c=0.0,                 # midpoint for F\n",
        "    k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "    theta_g=0.0,                 # midpoint for Γ\n",
        "    zeta=0.0,                    # tonic drive (scalar)\n",
        "    g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "    delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "    # input map\n",
        "    input_scale=0.2,\n",
        "\n",
        "    # randomization / sparsity\n",
        "    W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "    footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "    block_scale=1.0,             # base std for random blocks\n",
        "    eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "    # spectral safety targets (row budgets, both < 1)\n",
        "    rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "    rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "    # read-out\n",
        "    ridge_alpha=1e-6,\n",
        "    use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "    feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        ")\n",
        "trigr.fit_readout(train_input, train_target, discard=100)\n",
        "trigr_preds = trigr.predict_autoregressive(initial_input, num_steps)"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "c7c48b24",
      "metadata": {
        "id": "c7c48b24"
      },
      "source": [
        "### NRMSE Report"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "39c520c4",
      "metadata": {
        "id": "39c520c4"
      },
      "outputs": [],
      "source": [
        "esn_nrmse = evaluate_nrmse(esn_preds, test_target, all_horizons)\n",
        "cycle_res_nrmse = evaluate_nrmse(cycle_res_preds, test_target, all_horizons)\n",
        "crj_nrmse = evaluate_nrmse(crj_preds, test_target, all_horizons)\n",
        "mci_esn_nrmse = evaluate_nrmse(mci_esn_preds, test_target, all_horizons)\n",
        "deepesn_nrmse = evaluate_nrmse(deepesn_preds, test_target, all_horizons)\n",
        "trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "\n",
        "# Print results\n",
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 120)\n",
        "print(f\"{'Horizon':<10} {'ESN':<15} {'SCR':<15} {'CRJ':<15} {'MCI-ESN':<15} {'DeepESN':<15} {'TRIGR':<15}\")\n",
        "print(\"-\" * 120)\n",
        "\n",
        "for horizon in horizons:\n",
        "    print(f\"{horizon:<10} {np.mean(esn_nrmse[horizon]):<15.7f} {np.mean(cycle_res_nrmse[horizon]):<15.7f} {np.mean(crj_nrmse[horizon]):<15.7f} {np.mean(mci_esn_nrmse[horizon]):<15.7f} {np.mean(deepesn_nrmse[horizon]):<15.7f} {np.mean(trigr_nrmse[horizon]):<15.7f}\")"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "bcaacbdc",
      "metadata": {
        "id": "bcaacbdc"
      },
      "source": [
        "### VPT Report"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "acf3f06c",
      "metadata": {
        "id": "acf3f06c"
      },
      "outputs": [],
      "source": [
        "lle_lorenz = 0.830\n",
        "lyapunov_time_lorenz = 1.0 / lle_lorenz\n",
        "VPT_threshold = 0.3\n",
        "test_time = np.arange(test_size)*dt\n",
        "\n",
        "esn_VPT, esn_VPT_ratio = compute_valid_prediction_time(test_target, esn_preds, test_time, lyapunov_time_lorenz, VPT_threshold)\n",
        "cycle_res_VPT, cycle_res_VPT_ratio = compute_valid_prediction_time(test_target, cycle_res_preds, test_time, lyapunov_time_lorenz, VPT_threshold)\n",
        "crj_VPT, crj_VPT_ratio = compute_valid_prediction_time(test_target, crj_preds, test_time, lyapunov_time_lorenz, VPT_threshold)\n",
        "mci_esn_VPT, mci_esn_VPT_ratio = compute_valid_prediction_time(test_target, mci_esn_preds, test_time, lyapunov_time_lorenz, VPT_threshold)\n",
        "deepesn_VPT, deepesn_VPT_ratio = compute_valid_prediction_time(test_target, deepesn_preds, test_time, lyapunov_time_lorenz, VPT_threshold)\n",
        "trigr_VPT, trigr_VPT_ratio = compute_valid_prediction_time(test_target, trigr_preds, test_time, lyapunov_time_lorenz, VPT_threshold)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "60977aee",
      "metadata": {
        "id": "60977aee"
      },
      "outputs": [],
      "source": [
        "print(f\"{'':<20} {'ESN':<15} {'SCR':<15} {'CRJ':<15} {'MCI-ESN':<15} {'DeepESN':<15} {'TRIGR':<15}\")\n",
        "print(\"-\" * 130)\n",
        "print(f\"{'T_VPT':<20} {esn_VPT:<15.3f} {cycle_res_VPT:<15.3f} {crj_VPT:<15.3f} {mci_esn_VPT:<15.3f} {deepesn_VPT:<15.3f} {trigr_VPT:<15.3f}\")\n",
        "print(f\"{'T_VPT/T_lambda':<20} {esn_VPT_ratio:<15.3f} {cycle_res_VPT_ratio:<15.3f} {crj_VPT_ratio:<15.3f} {mci_esn_VPT_ratio:<15.3f} {deepesn_VPT_ratio:<15.3f} {trigr_VPT_ratio:<15.3f}\")"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "8aea9f1f",
      "metadata": {
        "id": "8aea9f1f"
      },
      "source": [
        "### Adev Report"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "ae0611e6",
      "metadata": {
        "id": "ae0611e6"
      },
      "outputs": [],
      "source": [
        "cube_size = (4, 4, 4)\n",
        "esn_adev = compute_attractor_deviation(esn_preds, test_target, cube_size)\n",
        "cycle_res_adev = compute_attractor_deviation(cycle_res_preds, test_target, cube_size)\n",
        "crj_adev = compute_attractor_deviation(crj_preds, test_target, cube_size)\n",
        "mci_esn_adev = compute_attractor_deviation(mci_esn_preds, test_target, cube_size)\n",
        "deepesn_adev = compute_attractor_deviation(deepesn_preds, test_target, cube_size)\n",
        "trigr_adev = compute_attractor_deviation(trigr_preds, test_target, cube_size)\n",
        "\n",
        "print(f\"{'':<20} {'ESN':<15} {'SCR':<15} {'CRJ':<15} {'MCI-ESN':<15} {'DeepESN':<15} {'TRIGR':<15}\")\n",
        "print(\"-\" * 130)\n",
        "print(f\"{'ADev':<20} {esn_adev:<15} {cycle_res_adev:<15} {crj_adev:<15} {mci_esn_adev:<15} {deepesn_adev:<15} {trigr_adev:<15}\")"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "bf706aa5",
      "metadata": {
        "id": "bf706aa5"
      },
      "source": [
        "### PSD Report"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "150d3d30",
      "metadata": {
        "id": "150d3d30"
      },
      "outputs": [],
      "source": [
        "target_freqs, target_psd = compute_psd(test_target, dt=dt)\n",
        "esn_freqs, esn_psd = compute_psd(esn_preds, dt=dt)\n",
        "# cycle_res_freqs, cycle_res_psd = compute_psd(cycle_res_preds, dt=dt)\n",
        "# crj_freqs, crj_psd = compute_psd(crj_preds, dt=dt)\n",
        "# mci_esn_freqs, mci_esn_psd = compute_psd(mci_esn_preds, dt=dt)\n",
        "# deepesn_freqs, deepesn_psd = compute_psd(deepesn_preds, dt=dt)\n",
        "trigr_freqs, trigr_psd = compute_psd(trigr_preds, dt=dt)\n",
        "\n",
        "\n",
        "# Plot the PSDs\n",
        "mask = target_freqs <= 3\n",
        "plt.figure(figsize=(5, 6))\n",
        "\n",
        "# True signal\n",
        "plt.semilogy(target_freqs[mask], target_psd[mask], label='True', linewidth=1.5, color='#108B8B')\n",
        "\n",
        "plt.semilogy(esn_freqs[mask], esn_psd[mask], label='ESN', linewidth=1.5, color='#EC6113')\n",
        "\n",
        "# Labels and formatting\n",
        "plt.xlabel('Frequency (Hz)', fontsize=12)\n",
        "plt.ylabel('Power Spectral Density', fontsize=12)\n",
        "# plt.legend(fontsize=11, frameon=False)\n",
        "plt.grid(True, linestyle='--', linewidth=0.5, alpha=0.0)\n",
        "plt.legend(fontsize=11, frameon=False, loc='best')\n",
        "\n",
        "plt.tight_layout()\n",
        "plt.savefig(\"Figures/PSD_vs_Frequency_rossler_esn.png\", dpi=400, bbox_inches='tight')\n",
        "plt.show()\n",
        "\n"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "fb25fc60",
      "metadata": {
        "id": "fb25fc60"
      },
      "source": [
        "### Trajectory Plots"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "76357443",
      "metadata": {
        "id": "76357443"
      },
      "outputs": [],
      "source": [
        "sns.set(style=\"whitegrid\")\n",
        "\n",
        "plot_len = 999\n",
        "steps = list(range(1, plot_len + 1))\n",
        "\n",
        "fig, axes = plt.subplots(3, 1, figsize=(14, 10), sharex=True)\n",
        "\n",
        "dims = ['x(t)', 'y(t)', 'z(t)']\n",
        "line_labels = ['True', 'DeepESN']\n",
        "line_styles = ['--', '-']\n",
        "line_colors = ['#2c3e94', '#e25822']\n",
        "\n",
        "for i in range(3):\n",
        "    axes[i].plot(steps, test_target[:plot_len, i], label=line_labels[0],\n",
        "                 linestyle=line_styles[0], linewidth=2.5, color=line_colors[0])\n",
        "    axes[i].plot(steps, deepesn_preds[:plot_len, i], label=line_labels[1],\n",
        "                 linestyle=line_styles[1], linewidth=2.5, color=line_colors[1])\n",
        "\n",
        "    axes[i].set_ylabel(dims[i], fontsize=13)\n",
        "    axes[i].legend(loc='upper right', fontsize=11, frameon=True)\n",
        "    axes[i].tick_params(axis='both', which='major', labelsize=11)\n",
        "    axes[i].grid(True, linestyle='--', linewidth=0.6, alpha=0.0)\n",
        "\n",
        "axes[-1].set_xlabel('Time Step', fontsize=13)\n",
        "# fig.suptitle('Predicted Trajectories for Test Segment (Autoregressive Forecasting)',\n",
        "#              fontsize=18, fontweight='bold')\n",
        "\n",
        "plt.tight_layout(rect=[0, 0.03, 1, 0.95])\n",
        "plt.savefig(\"Figures/Predicted Trajectories for Lorenz Test Segment - DeepESN.png\", dpi=400, bbox_inches='tight')\n",
        "plt.show()\n"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "72e10fd4",
      "metadata": {
        "id": "72e10fd4"
      },
      "outputs": [],
      "source": [
        "fig = plt.figure(figsize=(10, 5))\n",
        "ax = fig.add_subplot(projection='3d')\n",
        "\n",
        "# Plot True vs Predicted\n",
        "line, = ax.plot(deepesn_preds[:plot_len, 0],\n",
        "                deepesn_preds[:plot_len, 1],\n",
        "                deepesn_preds[:plot_len, 2],\n",
        "                label='True Trajectory',\n",
        "                linewidth=2,\n",
        "                color='#F64C72')\n",
        "line.set_dashes([4, 0.5])\n",
        "\n",
        "ax.grid(True)\n",
        "\n",
        "ax.tick_params(axis='x', colors='none')\n",
        "ax.tick_params(axis='y', colors='none')\n",
        "ax.tick_params(axis='z', colors='none')\n",
        "# Save the figure\n",
        "plt.savefig(\"Figures/Test Segment Lorenz - DeepESN.png\", dpi=400, bbox_inches='tight')\n",
        "plt.show()\n"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "85d38716",
      "metadata": {
        "id": "85d38716"
      },
      "outputs": [],
      "source": [
        "fig = plt.figure(figsize=(10, 5))\n",
        "ax = fig.add_subplot(projection='3d')\n",
        "\n",
        "# Define the color map based on the number of segments\n",
        "colors = cm.twilight(np.linspace(0, 1, len(test_target[:plot_len])))\n",
        "\n",
        "# Plot each segment of the trajectory with its corresponding color\n",
        "for i in range(plot_len - 1):\n",
        "    ax.plot(trigr_preds[i:i+2, 0],\n",
        "            trigr_preds[i:i+2, 1],\n",
        "            trigr_preds[i:i+2, 2],\n",
        "            color=colors[i], linewidth=1.5, alpha=0.9)\n",
        "\n",
        "# Add grid and hide tick marks\n",
        "ax.grid(True)\n",
        "ax.tick_params(axis='x', colors='none')\n",
        "ax.tick_params(axis='y', colors='none')\n",
        "ax.tick_params(axis='z', colors='none')\n",
        "\n",
        "plt.savefig(\"Figures/Lorenz Phase Space — Test Segment (Autoregressive Forecasting).png\", dpi=400, bbox_inches='tight')\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "8962b6fd",
      "metadata": {
        "id": "8962b6fd"
      },
      "source": [
        "# Experiments"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "28a844ec",
      "metadata": {
        "id": "28a844ec"
      },
      "source": [
        "## Experiments on Lorenz Dataset under Autoregressive Forecasting"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "7e6464a5",
      "metadata": {
        "id": "7e6464a5"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [200, 400, 600, 800, 1000]\n",
        "initial_input = test_input[0]\n",
        "num_steps = len(test_input)\n",
        "lle_lorenz = 0.9\n",
        "lyapunov_time_lorenz = 1.0 / lle_lorenz\n",
        "lyapunov_time = lyapunov_time_lorenz\n",
        "VPT_threshold = 0.4\n",
        "test_time = np.arange(test_size)*dt\n",
        "seeds = range(1, 6)\n",
        "train_fracs = [0.7,0.75,0.8]\n",
        "initial_states = [[1.0, 1.0, 1.0], [1.0, 2.0, 3.0], [2.0, 1.5, 4.0]]\n",
        "tmax = 250\n",
        "dt = 0.02\n",
        "\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "VPT_dict = defaultdict(list)\n",
        "VPT_ratio_dict = defaultdict(list)\n",
        "adev_dict = defaultdict(list)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "9c3efbc1",
      "metadata": {
        "id": "9c3efbc1"
      },
      "outputs": [],
      "source": [
        "nrmse_dict['ESN'] = []\n",
        "VPT_dict['ESN'] = []\n",
        "VPT_ratio_dict['ESN'] = []\n",
        "adev_dict['ESN'] = []\n",
        "\n",
        "nrmse_dict['SCR'] = []\n",
        "VPT_dict['SCR'] = []\n",
        "VPT_ratio_dict['SCR'] = []\n",
        "adev_dict['SCR'] = []\n",
        "\n",
        "nrmse_dict['CRJ'] = []\n",
        "VPT_dict['CRJ'] = []\n",
        "VPT_ratio_dict['CRJ'] = []\n",
        "adev_dict['CRJ'] = []\n",
        "\n",
        "nrmse_dict['MCI-ESN'] = []\n",
        "VPT_dict['MCI-ESN'] = []\n",
        "VPT_ratio_dict['MCI-ESN'] = []\n",
        "adev_dict['MCI-ESN'] = []\n",
        "\n",
        "nrmse_dict['DeepESN'] = []\n",
        "VPT_dict['DeepESN'] = []\n",
        "VPT_ratio_dict['DeepESN'] = []\n",
        "adev_dict['DeepESN'] = []\n",
        "\n",
        "nrmse_dict['TRIGR'] = []\n",
        "VPT_dict['TRIGR'] = []\n",
        "VPT_ratio_dict['TRIGR'] = []\n",
        "adev_dict['TRIGR'] = []"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "1816e8b7",
      "metadata": {
        "id": "1816e8b7"
      },
      "outputs": [],
      "source": [
        "for initial_state in initial_states:\n",
        "    t_vals, lorenz_traj = generate_lorenz_data(\n",
        "    initial_state=initial_state,\n",
        "    tmax=tmax,\n",
        "    dt=dt\n",
        "    )\n",
        "\n",
        "    washout = 2000\n",
        "    t_vals = t_vals[washout:]\n",
        "    lorenz_traj = lorenz_traj[washout:]\n",
        "\n",
        "    scaler = MinMaxScaler()\n",
        "    scaler.fit(lorenz_traj)\n",
        "    lorenz_traj = scaler.transform(lorenz_traj)\n",
        "    T_data = len(lorenz_traj)\n",
        "\n",
        "    for train_frac in train_fracs:\n",
        "        train_end = int(train_frac * (T_data - 1))\n",
        "        train_input = lorenz_traj[:train_end]\n",
        "        train_target = lorenz_traj[1:train_end + 1]\n",
        "        test_input = lorenz_traj[train_end:-1]\n",
        "        test_target = lorenz_traj[train_end + 1:]\n",
        "        num_steps = len(test_input)\n",
        "        initial_in = test_input[0]\n",
        "\n",
        "        for seed in seeds:\n",
        "            esn = ESN3D(\n",
        "                reservoir_size=300,\n",
        "                spectral_radius=0.92,\n",
        "                connectivity=0.2,\n",
        "                input_scale=0.6,\n",
        "                leaking_rate=0.9,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            esn.fit_readout(train_input, train_target, discard=100)\n",
        "            esn_preds = esn.predict_autoregressive(initial_input, num_steps)\n",
        "            esn_nrmse = evaluate_nrmse(esn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['ESN'].append(esn_nrmse)\n",
        "            esn_VPT, esn_VPT_ratio = compute_valid_prediction_time(test_target, esn_preds, test_time, lyapunov_time, VPT_threshold,dt)\n",
        "            VPT_dict['ESN'].append(esn_VPT)\n",
        "            VPT_ratio_dict['ESN'].append(esn_VPT_ratio)\n",
        "            esn_adev = compute_attractor_deviation(esn_preds, test_target)\n",
        "            adev_dict['ESN'].append(esn_adev)\n",
        "\n",
        "\n",
        "            cycle_res = CR3D(\n",
        "                reservoir_size=300,\n",
        "                spectral_radius=0.98,\n",
        "                input_scale=0.8,\n",
        "                leaking_rate=0.8,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            cycle_res.fit_readout(train_input, train_target, discard=100)\n",
        "            cycle_res_preds = cycle_res.predict_autoregressive(initial_input, num_steps)\n",
        "            cycle_res_nrmse = evaluate_nrmse(cycle_res_preds, test_target, all_horizons)\n",
        "            nrmse_dict['SCR'].append(cycle_res_nrmse)\n",
        "            cycle_res_VPT, cycle_res_VPT_ratio = compute_valid_prediction_time(test_target, cycle_res_preds, test_time, lyapunov_time, VPT_threshold, dt)\n",
        "            VPT_dict['SCR'].append(cycle_res_VPT)\n",
        "            VPT_ratio_dict['SCR'].append(cycle_res_VPT_ratio)\n",
        "            cycle_res_adev = compute_attractor_deviation(cycle_res_preds, test_target)\n",
        "            adev_dict['SCR'].append(cycle_res_adev)\n",
        "\n",
        "            crj = CRJ3D(\n",
        "                reservoir_size=300,\n",
        "                jump=20,\n",
        "                spectral_radius=0.98,\n",
        "                input_scale=0.7,\n",
        "                leaking_rate=0.5,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            crj.fit_readout(train_input, train_target, discard=100)\n",
        "            crj_preds = crj.predict_autoregressive(initial_input, num_steps)\n",
        "            crj_nrmse = evaluate_nrmse(crj_preds, test_target, all_horizons)\n",
        "            nrmse_dict['CRJ'].append(crj_nrmse)\n",
        "            crj_VPT, crj_VPT_ratio = compute_valid_prediction_time(test_target, crj_preds, test_time, lyapunov_time, VPT_threshold, dt)\n",
        "            VPT_dict['CRJ'].append(crj_VPT)\n",
        "            VPT_ratio_dict['CRJ'].append(crj_VPT_ratio)\n",
        "            crj_adev = compute_attractor_deviation(crj_preds, test_target)\n",
        "            adev_dict['CRJ'].append(crj_adev)\n",
        "\n",
        "            mci_esn = MCI3D(\n",
        "                reservoir_size=300,\n",
        "                cycle_weight=0.6,\n",
        "                connect_weight=0.6,\n",
        "                combine_factor=0.4,\n",
        "                input_scale=0.5,\n",
        "                leaking_rate=0.9,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            mci_esn.fit_readout(train_input, train_target, discard=100)\n",
        "            mci_esn_preds = mci_esn.predict_autoregressive(initial_input, num_steps)\n",
        "            mci_esn_nrmse = evaluate_nrmse(mci_esn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['MCI-ESN'].append(mci_esn_nrmse)\n",
        "            mci_esn_VPT, mci_esn_VPT_ratio = compute_valid_prediction_time(test_target, mci_esn_preds, test_time, lyapunov_time, VPT_threshold, dt)\n",
        "            VPT_dict['MCI-ESN'].append(mci_esn_VPT)\n",
        "            VPT_ratio_dict['MCI-ESN'].append(mci_esn_VPT_ratio)\n",
        "            mci_esn_adev = compute_attractor_deviation(mci_esn_preds, test_target)\n",
        "            adev_dict['MCI-ESN'].append(mci_esn_adev)\n",
        "\n",
        "            deepesn = DeepESN3D(\n",
        "                num_layers=3,\n",
        "                reservoir_size=100,\n",
        "                spectral_radius=0.95,\n",
        "                connectivity=0.05,\n",
        "                input_scale=0.8,\n",
        "                leaking_rate=0.3,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            deepesn.fit_readout(train_input, train_target, discard=100)\n",
        "            deepesn_preds = deepesn.predict_autoregressive(initial_input, num_steps)\n",
        "            deepesn_nrmse = evaluate_nrmse(deepesn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['DeepESN'].append(deepesn_nrmse)\n",
        "            deepesn_VPT, deepesn_VPT_ratio = compute_valid_prediction_time(test_target, deepesn_preds, test_time, lyapunov_time, VPT_threshold, dt)\n",
        "            VPT_dict['DeepESN'].append(deepesn_VPT)\n",
        "            VPT_ratio_dict['DeepESN'].append(deepesn_VPT_ratio)\n",
        "            deepesn_adev = compute_attractor_deviation(deepesn_preds, test_target)\n",
        "            adev_dict['DeepESN'].append(deepesn_adev)\n",
        "\n",
        "            trigr = GliaNeuronTripartiteReservoirESN(\n",
        "                # sizes\n",
        "                reservoir_size=300,          # N\n",
        "                input_dim=3,\n",
        "                astro_nx=20,                 # grid width\n",
        "                astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "                rel_channels=128,            # P\n",
        "\n",
        "                # kinetics / rates\n",
        "                leak_x=0.45,                 # λ\n",
        "                rate_c=0.05,                 # α\n",
        "                rate_g=0.05,                 # ρ\n",
        "                diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "                # neuron bias\n",
        "                bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "                # nonlinearities (F, Γ)\n",
        "                c_max=1.0,                   # max Ca\n",
        "                k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "                theta_c=0.0,                 # midpoint for F\n",
        "                k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "                theta_g=0.0,                 # midpoint for Γ\n",
        "                zeta=0.0,                    # tonic drive (scalar)\n",
        "                g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "                delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "                # input map\n",
        "                input_scale=0.2,\n",
        "\n",
        "                # randomization / sparsity\n",
        "                W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "                footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "                block_scale=1.0,             # base std for random blocks\n",
        "                eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "                # spectral safety targets (row budgets, both < 1)\n",
        "                rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "                rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "                # read-out\n",
        "                ridge_alpha=1e-6,\n",
        "                use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "                feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "            )\n",
        "            trigr.fit_readout(train_input, train_target, discard=100)\n",
        "            trigr_preds = trigr.predict_autoregressive(initial_input, num_steps)\n",
        "            trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "            nrmse_dict['TRIGR'].append(trigr_nrmse)\n",
        "            trigr_VPT, trigr_VPT_ratio = compute_valid_prediction_time(test_target, trigr_preds, test_time, lyapunov_time, VPT_threshold, dt)\n",
        "            VPT_dict['TRIGR'].append(trigr_VPT)\n",
        "            VPT_ratio_dict['TRIGR'].append(trigr_VPT_ratio)\n",
        "            trigr_adev = compute_attractor_deviation(trigr_preds, test_target)\n",
        "            adev_dict['TRIGR'].append(trigr_adev)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "d813e362",
      "metadata": {},
      "outputs": [],
      "source": [
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'ESN':<17} {'SCR':<17} {'CRJ':<17} {'MCI-ESN':<17} {'DeepESN':<17} {'TRIGR':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    esn_vals = [np.mean(esn_nrmse[horizon]) for esn_nrmse in nrmse_dict['ESN']]\n",
        "    scr_vals = [np.mean(cycle_res_nrmse[horizon]) for cycle_res_nrmse in nrmse_dict['SCR']]\n",
        "    crj_vals = [np.mean(crj_nrmse[horizon]) for crj_nrmse in nrmse_dict['CRJ']]\n",
        "    mci_vals = [np.mean(mci_esn_nrmse[horizon]) for mci_esn_nrmse in nrmse_dict['MCI-ESN']]\n",
        "    deep_vals = [np.mean(deepesn_nrmse[horizon]) for deepesn_nrmse in nrmse_dict['DeepESN']]\n",
        "    trigr_vals = [np.mean(trigr_nrmse[horizon]) for trigr_nrmse in nrmse_dict['TRIGR']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [esn_vals, scr_vals, crj_vals, mci_vals, deep_vals, trigr_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "59a60185",
      "metadata": {},
      "outputs": [],
      "source": [
        "plot_len = 1000\n",
        "steps = list(range(10, plot_len + 1, 10))\n",
        "marker_steps = [10, 200, 400, 600, 800, 1000]\n",
        "\n",
        "models = {\n",
        "    'ESN': esn_nrmse,\n",
        "    'SCR': cycle_res_nrmse,\n",
        "    'CRJ': crj_nrmse,\n",
        "    'MCI-ESN': mci_esn_nrmse,\n",
        "    'DeepESN': deepesn_nrmse,\n",
        "    'TRIGR': trigr_nrmse\n",
        "}\n",
        "\n",
        "# Assign a unique marker and color style for each\n",
        "colors = plt.cm.tab10.colors\n",
        "markers = ['o', 's', 'D', '^', 'v', 'P', 'X']\n",
        "\n",
        "plt.figure(figsize=(5, 6))\n",
        "\n",
        "for i, (name, data) in enumerate(models.items()):\n",
        "    values = [np.mean(data[s]) for s in steps]\n",
        "    color = colors[i % len(colors)]\n",
        "    marker = markers[i % len(markers)]\n",
        "    values = []\n",
        "\n",
        "    for horizon in all_horizons:\n",
        "        # Get all NRMSE values across all runs for this model and this horizon\n",
        "        all_vals = []\n",
        "        for run in nrmse_dict[name]:\n",
        "            all_vals.extend([np.mean(run[horizon])])\n",
        "        values.append(np.mean(all_vals))\n",
        "\n",
        "    # Plot with markers so legend also shows them\n",
        "    plt.plot(steps, values, label=name, linewidth=2.2, color=color,\n",
        "             marker=marker, markevery=[steps.index(s) for s in marker_steps if s in steps],\n",
        "             markersize=7)\n",
        "\n",
        "# Labels and title\n",
        "plt.xlabel('Prediction Horizon', fontsize=12)\n",
        "plt.ylabel('NRMSE', fontsize=12)\n",
        "# plt.title('NRMSE vs. Prediction Horizon (Autoregressive Forecasting)', fontsize=14, fontweight='bold')\n",
        "plt.grid(True, linestyle='--', linewidth=0.6, alpha=0.6)\n",
        "plt.legend(fontsize=9, ncol=2, loc='upper left')\n",
        "plt.tight_layout()\n",
        "plt.savefig(\"Figures/NRMSE_vs_Prediction_Horizon_AR_Lorenz.png\", dpi=400, bbox_inches='tight')\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "7e6d6212",
      "metadata": {},
      "outputs": [],
      "source": [
        "import matplotlib.pyplot as plt\n",
        "import seaborn as sns\n",
        "import pandas as pd\n",
        "\n",
        "target_horizon = 1000\n",
        "\n",
        "records = []\n",
        "for model_name in ['ESN', 'SCR', 'CRJ', 'MCI-ESN', 'DeepESN', 'TRIGR']:\n",
        "    model_vals = [np.mean(entry[target_horizon]) for entry in nrmse_dict[model_name]]\n",
        "    for val in model_vals:\n",
        "        records.append({\n",
        "            \"Model\": model_name,\n",
        "            \"NRMSE\": val\n",
        "        })\n",
        "\n",
        "df = pd.DataFrame(records)\n",
        "\n",
        "# ─── PLOTTING ──────────────────────────────────────────────────────────────\n",
        "sns.set(style=\"whitegrid\")\n",
        "plt.figure(figsize=(6, 6))\n",
        "\n",
        "sns.boxplot(data=df, x='Model', y='Value', palette='Set2', showfliers=False)\n",
        "# plt.title(f'Boxplot of NRMSE at Horizon {target_horizon}')\n",
        "plt.ylabel('NRMSE')\n",
        "plt.xticks(rotation=45)\n",
        "plt.grid(True, linestyle='--', alpha=0.5)\n",
        "plt.tight_layout()\n",
        "plt.savefig(f\"BoxPlot_NRMSE_H{target_horizon}_Lorenz-trigr.png\", dpi=400)\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "c72d3659",
      "metadata": {},
      "outputs": [],
      "source": [
        "print(f\"{'':<20} {'ESN':<20} {'SCR':<20} {'CRJ':<20} {'MCI-ESN':<20} {'DeepESN':<20} {'TRIGR':<20}\")\n",
        "print(\"-\" * 160)\n",
        "\n",
        "print(f\"{'T_VPT':<20}\", end='')\n",
        "for model in ['ESN', 'SCR', 'CRJ', 'MCI-ESN', 'DeepESN', 'TRIGR']:\n",
        "    mean = np.mean(VPT_dict[model])\n",
        "    std = np.std(VPT_dict[model])\n",
        "    print(f\"{mean:.3f} ± {std:.2f}\".ljust(20), end='')\n",
        "print()\n",
        "\n",
        "print(f\"{'T_VPT/T_lambda':<20}\", end='')\n",
        "for model in ['ESN', 'SCR', 'CRJ', 'MCI-ESN', 'DeepESN', 'TRIGR']:\n",
        "    mean = np.mean(VPT_ratio_dict[model])\n",
        "    std = np.std(VPT_ratio_dict[model])\n",
        "    print(f\"{mean:.3f} ± {std:.2f}\".ljust(20), end='')\n",
        "print()\n"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "39b8ffb8",
      "metadata": {},
      "outputs": [],
      "source": [
        "print(f\"{'':<20} {'ESN':<20} {'SCR':<20} {'CRJ':<20} {'MCI-ESN':<20} {'DeepESN':<20} {'TRIGR':<20}\")\n",
        "print(\"-\" * 160)\n",
        "\n",
        "print(f\"{'ADev':<20}\", end='')\n",
        "for model in ['ESN', 'SCR', 'CRJ', 'MCI-ESN', 'DeepESN', 'TRIGR']:\n",
        "    values = adev_dict[model]\n",
        "    mean = np.mean(values)\n",
        "    mad = np.mean(np.abs(values - mean))\n",
        "    print(f\"{mean:.2f} ± {mad:.2f}\".ljust(20), end='')\n",
        "print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "4afac07e",
      "metadata": {
        "id": "4afac07e"
      },
      "source": [
        "## Experiments on Lorenz Dataset in Teacher-forced setting"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "30ccc83a",
      "metadata": {
        "id": "30ccc83a"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [200, 400, 600, 800, 1000]\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "seeds = range(995, 1025)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "9a2f0154",
      "metadata": {
        "id": "9a2f0154"
      },
      "outputs": [],
      "source": [
        "nrmse_dict['ESN'] = []\n",
        "nrmse_dict['SCR'] = []\n",
        "nrmse_dict['CRJ'] = []\n",
        "nrmse_dict['MCI-ESN'] = []\n",
        "nrmse_dict['DeepESN'] = []\n",
        "nrmse_dict['TRIGR'] = []"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "c440ac10",
      "metadata": {
        "id": "c440ac10"
      },
      "outputs": [],
      "source": [
        "nrmse_dict['ESN'] = []\n",
        "\n",
        "for initial_state in initial_states:\n",
        "    t_vals, lorenz_traj = generate_lorenz_data(\n",
        "    initial_state=initial_state,\n",
        "    tmax=tmax,\n",
        "    dt=dt\n",
        "    )\n",
        "\n",
        "    washout = 2000\n",
        "    t_vals = t_vals[washout:]\n",
        "    lorenz_traj = lorenz_traj[washout:]\n",
        "\n",
        "    scaler = MinMaxScaler()\n",
        "    scaler.fit(lorenz_traj)\n",
        "    lorenz_traj = scaler.transform(lorenz_traj)\n",
        "    T_data = len(lorenz_traj)\n",
        "\n",
        "    for train_frac in train_fracs:\n",
        "        train_end = int(train_frac * (T_data - 1))\n",
        "        train_input = lorenz_traj[:train_end]\n",
        "        train_target = lorenz_traj[1:train_end + 1]\n",
        "        test_input = lorenz_traj[train_end:-1]\n",
        "        test_target = lorenz_traj[train_end + 1:]\n",
        "        n_test_steps = len(test_input)\n",
        "        initial_in = test_input[0]\n",
        "\n",
        "        for seed in seeds:\n",
        "            esn = ESN3D(\n",
        "                reservoir_size=300,\n",
        "                spectral_radius=0.92,\n",
        "                connectivity=0.2,\n",
        "                input_scale=0.6,\n",
        "                leaking_rate=0.9,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            esn.fit_readout(train_input, train_target, discard=100)\n",
        "            esn_preds = esn.predict_open_loop(test_input)\n",
        "            esn_nrmse = evaluate_nrmse(esn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['ESN'].append(esn_nrmse)\n",
        "\n",
        "\n",
        "            cycle_res = CR3D(\n",
        "                reservoir_size=300,\n",
        "                spectral_radius=0.98,\n",
        "                input_scale=0.8,\n",
        "                leaking_rate=0.8,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            cycle_res.fit_readout(train_input, train_target, discard=100)\n",
        "            cycle_res_preds = cycle_res.predict_autoregressive(initial_input, num_steps)\n",
        "            cycle_res_nrmse = evaluate_nrmse(cycle_res_preds, test_target, all_horizons)\n",
        "            nrmse_dict['SCR'].append(cycle_res_nrmse)\n",
        "\n",
        "            crj = CRJ3D(\n",
        "                reservoir_size=300,\n",
        "                jump=20,\n",
        "                spectral_radius=0.98,\n",
        "                input_scale=0.7,\n",
        "                leaking_rate=0.5,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            crj.fit_readout(train_input, train_target, discard=100)\n",
        "            crj_preds = crj.predict_autoregressive(initial_input, num_steps)\n",
        "            crj_nrmse = evaluate_nrmse(crj_preds, test_target, all_horizons)\n",
        "            nrmse_dict['CRJ'].append(crj_nrmse)\n",
        "\n",
        "            mci_esn = MCI3D(\n",
        "                reservoir_size=300,\n",
        "                cycle_weight=0.6,\n",
        "                connect_weight=0.6,\n",
        "                combine_factor=0.4,\n",
        "                input_scale=0.5,\n",
        "                leaking_rate=0.9,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            mci_esn.fit_readout(train_input, train_target, discard=100)\n",
        "            mci_esn_preds = mci_esn.predict_autoregressive(initial_input, num_steps)\n",
        "            mci_esn_nrmse = evaluate_nrmse(mci_esn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['MCI-ESN'].append(mci_esn_nrmse)\n",
        "\n",
        "            deepesn = DeepESN3D(\n",
        "                num_layers=3,\n",
        "                reservoir_size=100,\n",
        "                spectral_radius=0.95,\n",
        "                connectivity=0.05,\n",
        "                input_scale=0.8,\n",
        "                leaking_rate=0.3,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            deepesn.fit_readout(train_input, train_target, discard=100)\n",
        "            deepesn_preds = deepesn.predict_autoregressive(initial_input, num_steps)\n",
        "            deepesn_nrmse = evaluate_nrmse(deepesn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['DeepESN'].append(deepesn_nrmse)\n",
        "\n",
        "            trigr = GliaNeuronTripartiteReservoirESN(\n",
        "                    reservoir_size=300,\n",
        "                    n_astrocytes = 20,\n",
        "                    input_dim=3,\n",
        "                    rho_star=0.92,\n",
        "                    alpha=1,\n",
        "                    tau_c=200,\n",
        "                    eta=0.74,\n",
        "                    D_diff=0.15,\n",
        "                    theta=0.38,\n",
        "                    gamma_glia=0.19,\n",
        "                    input_scale=0.9,\n",
        "                    ridge_alpha=1e-6,\n",
        "                    seed=seed\n",
        "            )\n",
        "            trigr.fit_readout(train_input, train_target, discard=100)\n",
        "            trigr_preds = trigr.predict_autoregressive(initial_input, num_steps)\n",
        "            trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "            nrmse_dict['TRIGR'].append(trigr_nrmse)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "d8082c68",
      "metadata": {
        "id": "d8082c68"
      },
      "outputs": [],
      "source": [
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'ESN':<17} {'SCR':<17} {'CRJ':<17} {'MCI-ESN':<17} {'DeepESN':<17} {'TRIGR':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    esn_vals = [np.mean(esn_nrmse[horizon]) for esn_nrmse in nrmse_dict['ESN']]\n",
        "    scr_vals = [np.mean(cycle_res_nrmse[horizon]) for cycle_res_nrmse in nrmse_dict['SCR']]\n",
        "    crj_vals = [np.mean(crj_nrmse[horizon]) for crj_nrmse in nrmse_dict['CRJ']]\n",
        "    mci_vals = [np.mean(mci_esn_nrmse[horizon]) for mci_esn_nrmse in nrmse_dict['MCI-ESN']]\n",
        "    deep_vals = [np.mean(deepesn_nrmse[horizon]) for deepesn_nrmse in nrmse_dict['DeepESN']]\n",
        "    trigr_vals = [np.mean(trigr_nrmse[horizon]) for trigr_nrmse in nrmse_dict['TRIGR']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [esn_vals, scr_vals, crj_vals, mci_vals, deep_vals, trigr_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean*10000:.4f} ± {std*10000:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "8b43b45c",
      "metadata": {
        "id": "8b43b45c"
      },
      "source": [
        "## Experiments on Rossler Dataset under Autoregressive Forecasting"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "179a736b",
      "metadata": {
        "id": "179a736b"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [200, 400, 600, 800, 1000]\n",
        "initial_input = test_input[0]\n",
        "num_steps = len(test_input)\n",
        "lle_rossler = 0.071\n",
        "lyapunov_time_rossler = 1.0 / lle_rossler\n",
        "lyapunov_time = lyapunov_time_rossler\n",
        "VPT_threshold = 0.4\n",
        "test_time = np.arange(test_size)*dt\n",
        "seeds = range(1, 6)\n",
        "train_fracs = [0.3, 0.35, 0.4]\n",
        "initial_states = [[1.0, 1.0, 1.0], [1.0, 2.0, 3.0], [2.0, 1.5, 4.0]]\n",
        "tmax = 250\n",
        "dt = 0.02\n",
        "\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "VPT_dict = defaultdict(list)\n",
        "VPT_ratio_dict = defaultdict(list)\n",
        "adev_dict = defaultdict(list)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "HTXT5hPbDFHR",
      "metadata": {
        "id": "HTXT5hPbDFHR"
      },
      "outputs": [],
      "source": [
        "nrmse_dict['ESN'] = []\n",
        "VPT_dict['ESN'] = []\n",
        "VPT_ratio_dict['ESN'] = []\n",
        "adev_dict['ESN'] = []\n",
        "\n",
        "nrmse_dict['SCR'] = []\n",
        "VPT_dict['SCR'] = []\n",
        "VPT_ratio_dict['SCR'] = []\n",
        "adev_dict['SCR'] = []\n",
        "\n",
        "nrmse_dict['CRJ'] = []\n",
        "VPT_dict['CRJ'] = []\n",
        "VPT_ratio_dict['CRJ'] = []\n",
        "adev_dict['CRJ'] = []\n",
        "\n",
        "nrmse_dict['MCI-ESN'] = []\n",
        "VPT_dict['MCI-ESN'] = []\n",
        "VPT_ratio_dict['MCI-ESN'] = []\n",
        "adev_dict['MCI-ESN'] = []\n",
        "\n",
        "nrmse_dict['DeepESN'] = []\n",
        "VPT_dict['DeepESN'] = []\n",
        "VPT_ratio_dict['DeepESN'] = []\n",
        "adev_dict['DeepESN'] = []\n",
        "\n",
        "nrmse_dict['TRIGR'] = []\n",
        "VPT_dict['TRIGR'] = []\n",
        "VPT_ratio_dict['TRIGR'] = []\n",
        "adev_dict['TRIGR'] = []"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "KkpS4P1XAzqg",
      "metadata": {
        "id": "KkpS4P1XAzqg"
      },
      "outputs": [],
      "source": [
        "for initial_state in initial_states:\n",
        "    t_vals, rossler_traj = generate_rossler_data(\n",
        "    initial_state=initial_state,\n",
        "    tmax=tmax,\n",
        "    dt=dt\n",
        "    )\n",
        "\n",
        "    washout = 2000\n",
        "    t_vals = t_vals[washout:]\n",
        "    rossler_traj = rossler_traj[washout:]\n",
        "\n",
        "    scaler = MinMaxScaler()\n",
        "    scaler.fit(rossler_traj)\n",
        "    rossler_traj = scaler.transform(rossler_traj)\n",
        "    T_data = len(rossler_traj)\n",
        "\n",
        "    for train_frac in train_fracs:\n",
        "        train_end = int(train_frac * (T_data - 1))\n",
        "        train_input = rossler_traj[:train_end]\n",
        "        train_target = rossler_traj[1:train_end + 1]\n",
        "        test_input = rossler_traj[train_end:-1]\n",
        "        test_target = rossler_traj[train_end + 1:]\n",
        "        n_test_steps = len(test_input)\n",
        "        initial_in = test_input[0]\n",
        "\n",
        "        for seed in seeds:\n",
        "            # Baseline ESN\n",
        "            esn = ESN3D(\n",
        "                reservoir_size=300,\n",
        "                spectral_radius=0.92,\n",
        "                connectivity=0.2,\n",
        "                input_scale=0.6,\n",
        "                leaking_rate=0.9,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            esn.fit_readout(train_input, train_target, discard=100)\n",
        "            esn_preds = esn.predict_autoregressive(initial_input, num_steps)\n",
        "            esn_nrmse = evaluate_nrmse(esn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['ESN'].append(esn_nrmse)\n",
        "            esn_VPT, esn_VPT_ratio = compute_valid_prediction_time(test_target, esn_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['ESN'].append(esn_VPT)\n",
        "            VPT_ratio_dict['ESN'].append(esn_VPT_ratio)\n",
        "            esn_adev = compute_attractor_deviation(esn_preds, test_target)\n",
        "            adev_dict['ESN'].append(esn_adev)\n",
        "\n",
        "\n",
        "            # Cycle Reservoir\n",
        "            cycle_res = CR3D(\n",
        "                reservoir_size=300,\n",
        "                spectral_radius=0.98,\n",
        "                input_scale=0.8,\n",
        "                leaking_rate=0.8,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            cycle_res.fit_readout(train_input, train_target, discard=100)\n",
        "            cycle_res_preds = cycle_res.predict_autoregressive(initial_input, num_steps)\n",
        "            cycle_res_nrmse = evaluate_nrmse(cycle_res_preds, test_target, all_horizons)\n",
        "            nrmse_dict['SCR'].append(cycle_res_nrmse)\n",
        "            cycle_res_VPT, cycle_res_VPT_ratio = compute_valid_prediction_time(test_target, cycle_res_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['SCR'].append(cycle_res_VPT)\n",
        "            VPT_ratio_dict['SCR'].append(cycle_res_VPT_ratio)\n",
        "            cycle_res_adev = compute_attractor_deviation(cycle_res_preds, test_target)\n",
        "            adev_dict['SCR'].append(cycle_res_adev)\n",
        "\n",
        "            crj = CRJ3D(\n",
        "                reservoir_size=300,\n",
        "                jump=20,\n",
        "                spectral_radius=0.98,\n",
        "                input_scale=0.7,\n",
        "                leaking_rate=0.5,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            crj.fit_readout(train_input, train_target, discard=100)\n",
        "            crj_preds = crj.predict_autoregressive(initial_input, num_steps)\n",
        "            crj_nrmse = evaluate_nrmse(crj_preds, test_target, all_horizons)\n",
        "            nrmse_dict['CRJ'].append(crj_nrmse)\n",
        "            crj_VPT, crj_VPT_ratio = compute_valid_prediction_time(test_target, crj_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['CRJ'].append(crj_VPT)\n",
        "            VPT_ratio_dict['CRJ'].append(crj_VPT_ratio)\n",
        "            crj_adev = compute_attractor_deviation(crj_preds, test_target)\n",
        "            adev_dict['CRJ'].append(crj_adev)\n",
        "\n",
        "            mci_esn = MCI3D(\n",
        "                reservoir_size=150,\n",
        "                cycle_weight=0.6,\n",
        "                connect_weight=0.6,\n",
        "                combine_factor=0.4,\n",
        "                input_scale=0.5,\n",
        "                leaking_rate=0.9,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            mci_esn.fit_readout(train_input, train_target, discard=100)\n",
        "            mci_esn_preds = mci_esn.predict_autoregressive(initial_input, num_steps)\n",
        "            mci_esn_nrmse = evaluate_nrmse(mci_esn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['MCI-ESN'].append(mci_esn_nrmse)\n",
        "            mci_esn_VPT, mci_esn_VPT_ratio = compute_valid_prediction_time(test_target, mci_esn_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['MCI-ESN'].append(mci_esn_VPT)\n",
        "            VPT_ratio_dict['MCI-ESN'].append(mci_esn_VPT_ratio)\n",
        "            mci_esn_adev = compute_attractor_deviation(mci_esn_preds, test_target)\n",
        "            adev_dict['MCI-ESN'].append(mci_esn_adev)\n",
        "\n",
        "            deepesn = DeepESN3D(\n",
        "                num_layers=3,\n",
        "                reservoir_size=100,\n",
        "                spectral_radius=0.95,\n",
        "                connectivity=0.05,\n",
        "                input_scale=0.8,\n",
        "                leaking_rate=0.3,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            deepesn.fit_readout(train_input, train_target, discard=100)\n",
        "            deepesn_preds = deepesn.predict_autoregressive(initial_input, num_steps)\n",
        "            deepesn_nrmse = evaluate_nrmse(deepesn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['DeepESN'].append(deepesn_nrmse)\n",
        "            deepesn_VPT, deepesn_VPT_ratio = compute_valid_prediction_time(test_target, deepesn_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['DeepESN'].append(deepesn_VPT)\n",
        "            VPT_ratio_dict['DeepESN'].append(deepesn_VPT_ratio)\n",
        "            deepesn_adev = compute_attractor_deviation(deepesn_preds, test_target)\n",
        "            adev_dict['DeepESN'].append(deepesn_adev)\n",
        "\n",
        "            trigr = GliaNeuronTripartiteReservoirESN(\n",
        "                # sizes\n",
        "                reservoir_size=300,          # N\n",
        "                input_dim=3,\n",
        "                astro_nx=20,                 # grid width\n",
        "                astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "                rel_channels=128,            # P\n",
        "\n",
        "                # kinetics / rates\n",
        "                leak_x=0.45,                 # λ\n",
        "                rate_c=0.05,                 # α\n",
        "                rate_g=0.05,                 # ρ\n",
        "                diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "                # neuron bias\n",
        "                bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "                # nonlinearities (F, Γ)\n",
        "                c_max=1.0,                   # max Ca\n",
        "                k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "                theta_c=0.0,                 # midpoint for F\n",
        "                k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "                theta_g=0.0,                 # midpoint for Γ\n",
        "                zeta=0.0,                    # tonic drive (scalar)\n",
        "                g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "                delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "                # input map\n",
        "                input_scale=0.2,\n",
        "\n",
        "                # randomization / sparsity\n",
        "                W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "                footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "                block_scale=1.0,             # base std for random blocks\n",
        "                eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "                # spectral safety targets (row budgets, both < 1)\n",
        "                rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "                rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "                # read-out\n",
        "                ridge_alpha=1e-6,\n",
        "                use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "                feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "            )\n",
        "            trigr.fit_readout(train_input, train_target, discard=100)\n",
        "            trigr_preds = trigr.predict_autoregressive(initial_input, num_steps)\n",
        "            trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "            nrmse_dict['TRIGR'].append(trigr_nrmse)\n",
        "            trigr_VPT, trigr_VPT_ratio = compute_valid_prediction_time(test_target, trigr_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['TRIGR'].append(trigr_VPT)\n",
        "            VPT_ratio_dict['TRIGR'].append(trigr_VPT_ratio)\n",
        "            trigr_adev = compute_attractor_deviation(trigr_preds, test_target)\n",
        "            adev_dict['TRIGR'].append(trigr_adev)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "5c2a8374",
      "metadata": {
        "id": "5c2a8374"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "82b7cd5a",
      "metadata": {},
      "outputs": [],
      "source": [
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'ESN':<17} {'SCR':<17} {'CRJ':<17} {'MCI-ESN':<17} {'DeepESN':<17} {'TRIGR':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    esn_vals = [np.mean(esn_nrmse[horizon]) for esn_nrmse in nrmse_dict['ESN']]\n",
        "    scr_vals = [np.mean(cycle_res_nrmse[horizon]) for cycle_res_nrmse in nrmse_dict['SCR']]\n",
        "    crj_vals = [np.mean(crj_nrmse[horizon]) for crj_nrmse in nrmse_dict['CRJ']]\n",
        "    mci_vals = [np.mean(mci_esn_nrmse[horizon]) for mci_esn_nrmse in nrmse_dict['MCI-ESN']]\n",
        "    deep_vals = [np.mean(deepesn_nrmse[horizon]) for deepesn_nrmse in nrmse_dict['DeepESN']]\n",
        "    trigr_vals = [np.mean(trigr_nrmse[horizon]) for trigr_nrmse in nrmse_dict['TRIGR']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [esn_vals, scr_vals, crj_vals, mci_vals, deep_vals, trigr_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "742c9fc5",
      "metadata": {},
      "outputs": [],
      "source": [
        "plot_len = 1000\n",
        "steps = list(range(10, plot_len + 1, 10))\n",
        "marker_steps = [10, 200, 400, 600, 800, 1000]\n",
        "\n",
        "models = {\n",
        "    'ESN': esn_nrmse,\n",
        "    'SCR': cycle_res_nrmse,\n",
        "    'CRJ': crj_nrmse,\n",
        "    'MCI-ESN': mci_esn_nrmse,\n",
        "    'DeepESN': deepesn_nrmse,\n",
        "    'TRIGR': trigr_nrmse\n",
        "}\n",
        "\n",
        "# Assign a unique marker and color style for each\n",
        "colors = plt.cm.tab10.colors\n",
        "markers = ['o', 's', 'D', '^', 'v', 'P', 'X']\n",
        "\n",
        "plt.figure(figsize=(5, 6))\n",
        "\n",
        "for i, (name, data) in enumerate(models.items()):\n",
        "    values = [np.mean(data[s]) for s in steps]\n",
        "    color = colors[i % len(colors)]\n",
        "    marker = markers[i % len(markers)]\n",
        "    values = []\n",
        "\n",
        "    for horizon in all_horizons:\n",
        "        # Get all NRMSE values across all runs for this model and this horizon\n",
        "        all_vals = []\n",
        "        for run in nrmse_dict[name]:\n",
        "            all_vals.extend([np.mean(run[horizon])])\n",
        "        values.append(np.mean(all_vals))\n",
        "\n",
        "    # Plot with markers so legend also shows them\n",
        "    plt.plot(steps, values, label=name, linewidth=2.2, color=color,\n",
        "             marker=marker, markevery=[steps.index(s) for s in marker_steps if s in steps],\n",
        "             markersize=7)\n",
        "\n",
        "# Labels and title\n",
        "plt.xlabel('Prediction Horizon', fontsize=12)\n",
        "plt.ylabel('NRMSE', fontsize=12)\n",
        "# plt.title('NRMSE vs. Prediction Horizon (Autoregressive Forecasting)', fontsize=14, fontweight='bold')\n",
        "plt.grid(True, linestyle='--', linewidth=0.6, alpha=0.6)\n",
        "plt.legend(fontsize=9, ncol=2, loc='upper left')\n",
        "plt.tight_layout()\n",
        "plt.savefig(\"Figures/NRMSE_vs_Prediction_Horizon_AR_Rossler.png\", dpi=400, bbox_inches='tight')\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "219bcc84",
      "metadata": {},
      "outputs": [],
      "source": [
        "import matplotlib.pyplot as plt\n",
        "import seaborn as sns\n",
        "import pandas as pd\n",
        "\n",
        "target_horizon = 1000\n",
        "\n",
        "records = []\n",
        "for model_name in ['ESN', 'SCR', 'CRJ', 'MCI-ESN', 'DeepESN', 'TRIGR']:\n",
        "    model_vals = [np.mean(entry[target_horizon]) for entry in nrmse_dict[model_name]]\n",
        "    for val in model_vals:\n",
        "        records.append({\n",
        "            \"Model\": model_name,\n",
        "            \"NRMSE\": val\n",
        "        })\n",
        "\n",
        "df = pd.DataFrame(records)\n",
        "\n",
        "# ─── PLOTTING ──────────────────────────────────────────────────────────────\n",
        "sns.set(style=\"whitegrid\")\n",
        "plt.figure(figsize=(6, 6))\n",
        "\n",
        "sns.boxplot(data=df, x='Model', y='Value', palette='Set2', showfliers=False)\n",
        "# plt.title(f'Boxplot of NRMSE at Horizon {target_horizon}')\n",
        "plt.ylabel('NRMSE')\n",
        "plt.xticks(rotation=45)\n",
        "plt.grid(True, linestyle='--', alpha=0.5)\n",
        "plt.tight_layout()\n",
        "plt.savefig(f\"BoxPlot_NRMSE_H{target_horizon}_Rossler-trigr.png\", dpi=400)\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "da920e03",
      "metadata": {},
      "outputs": [],
      "source": [
        "print(f\"{'':<20} {'ESN':<20} {'SCR':<20} {'CRJ':<20} {'MCI-ESN':<20} {'DeepESN':<20} {'TRIGR':<20}\")\n",
        "print(\"-\" * 160)\n",
        "\n",
        "print(f\"{'T_VPT':<20}\", end='')\n",
        "for model in ['ESN', 'SCR', 'CRJ', 'MCI-ESN', 'DeepESN', 'TRIGR']:\n",
        "    mean = np.mean(VPT_dict[model])\n",
        "    std = np.std(VPT_dict[model])\n",
        "    print(f\"{mean:.3f} ± {std:.2f}\".ljust(20), end='')\n",
        "print()\n",
        "\n",
        "print(f\"{'T_VPT/T_lambda':<20}\", end='')\n",
        "for model in ['ESN', 'SCR', 'CRJ', 'MCI-ESN', 'DeepESN', 'TRIGR']:\n",
        "    mean = np.mean(VPT_ratio_dict[model])\n",
        "    std = np.std(VPT_ratio_dict[model])\n",
        "    print(f\"{mean:.3f} ± {std:.2f}\".ljust(20), end='')\n",
        "print()\n"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "a3218c7d",
      "metadata": {},
      "outputs": [],
      "source": [
        "print(f\"{'':<20} {'ESN':<20} {'SCR':<20} {'CRJ':<20} {'MCI-ESN':<20} {'DeepESN':<20} {'TRIGR':<20}\")\n",
        "print(\"-\" * 160)\n",
        "\n",
        "print(f\"{'ADev':<20}\", end='')\n",
        "for model in ['ESN', 'SCR', 'CRJ', 'MCI-ESN', 'DeepESN', 'TRIGR']:\n",
        "    values = adev_dict[model]\n",
        "    mean = np.mean(values)\n",
        "    mad = np.mean(np.abs(values - mean))\n",
        "    print(f\"{mean:.2f} ± {mad:.2f}\".ljust(20), end='')\n",
        "print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "c0af9f32",
      "metadata": {
        "id": "c0af9f32"
      },
      "source": [
        "## Experiments on Rossler Dataset in Teacher-Forced Setting"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "818db52a",
      "metadata": {
        "id": "818db52a"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [200, 400, 600, 800, 1000]\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "seeds = range(1, 6)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "Lj6inF9bFxKh",
      "metadata": {
        "id": "Lj6inF9bFxKh"
      },
      "outputs": [],
      "source": [
        "nrmse_dict['ESN'] = []\n",
        "nrmse_dict['SCR'] = []\n",
        "nrmse_dict['CRJ'] = []\n",
        "nrmse_dict['MCI-ESN'] = []\n",
        "nrmse_dict['DeepESN'] = []\n",
        "nrmse_dict['TRIGR'] = []"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "IaSmCrJgGtVt",
      "metadata": {
        "id": "IaSmCrJgGtVt"
      },
      "outputs": [],
      "source": [
        "for initial_state in initial_states:\n",
        "    t_vals, rossler_traj = generate_rossler_data(\n",
        "    initial_state=initial_state,\n",
        "    tmax=tmax,\n",
        "    dt=dt\n",
        "    )\n",
        "\n",
        "    washout = 2000\n",
        "    t_vals = t_vals[washout:]\n",
        "    rossler_traj = rossler_traj[washout:]\n",
        "\n",
        "    scaler = MinMaxScaler()\n",
        "    scaler.fit(rossler_traj)\n",
        "    rossler_traj = scaler.transform(rossler_traj)\n",
        "    T_data = len(rossler_traj)\n",
        "\n",
        "    for train_frac in train_fracs:\n",
        "        train_end = int(train_frac * (T_data - 1))\n",
        "        train_input = rossler_traj[:train_end]\n",
        "        train_target = rossler_traj[1:train_end + 1]\n",
        "        test_input = rossler_traj[train_end:-1]\n",
        "        test_target = rossler_traj[train_end + 1:]\n",
        "        n_test_steps = len(test_input)\n",
        "        initial_in = test_input[0]\n",
        "\n",
        "        for seed in seeds:\n",
        "            # Baseline ESN\n",
        "            esn = ESN3D(\n",
        "                reservoir_size=300,\n",
        "                spectral_radius=0.92,\n",
        "                connectivity=0.2,\n",
        "                input_scale=0.6,\n",
        "                leaking_rate=0.9,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            esn.fit_readout(train_input, train_target, discard=100)\n",
        "            esn_preds = esn.predict_open_loop(test_input)\n",
        "            esn_nrmse = evaluate_nrmse(esn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['ESN'].append(esn_nrmse)\n",
        "\n",
        "            # Cycle Reservoir\n",
        "            cycle_res = CR3D(\n",
        "                reservoir_size=300,\n",
        "                spectral_radius=0.98,\n",
        "                input_scale=0.8,\n",
        "                leaking_rate=0.8,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            cycle_res.fit_readout(train_input, train_target, discard=100)\n",
        "            cycle_res_preds = cycle_res.predict_open_loop(test_input)\n",
        "            cycle_res_nrmse = evaluate_nrmse(cycle_res_preds, test_target, all_horizons)\n",
        "            nrmse_dict['SCR'].append(cycle_res_nrmse)\n",
        "\n",
        "            crj = CRJ3D(\n",
        "                reservoir_size=300,\n",
        "                jump=20,\n",
        "                spectral_radius=0.98,\n",
        "                input_scale=0.7,\n",
        "                leaking_rate=0.5,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            crj.fit_readout(train_input, train_target, discard=100)\n",
        "            crj_preds = crj.predict_open_loop(test_input)\n",
        "            crj_nrmse = evaluate_nrmse(crj_preds, test_target, all_horizons)\n",
        "            nrmse_dict['CRJ'].append(crj_nrmse)\n",
        "\n",
        "            mci_esn = MCI3D(\n",
        "                reservoir_size=150,\n",
        "                cycle_weight=0.6,\n",
        "                connect_weight=0.6,\n",
        "                combine_factor=0.4,\n",
        "                input_scale=0.5,\n",
        "                leaking_rate=0.9,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            mci_esn.fit_readout(train_input, train_target, discard=100)\n",
        "            mci_esn_preds = mci_esn.predict_open_loop(test_input)\n",
        "            mci_esn_nrmse = evaluate_nrmse(mci_esn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['MCI-ESN'].append(mci_esn_nrmse)\n",
        "\n",
        "            deepesn = DeepESN3D(\n",
        "                num_layers=3,\n",
        "                reservoir_size=100,\n",
        "                spectral_radius=0.95,\n",
        "                connectivity=0.05,\n",
        "                input_scale=0.8,\n",
        "                leaking_rate=0.3,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            deepesn.fit_readout(train_input, train_target, discard=100)\n",
        "            deepesn_preds = deepesn.predict_open_loop(test_input)\n",
        "            deepesn_nrmse = evaluate_nrmse(deepesn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['DeepESN'].append(deepesn_nrmse)\n",
        "\n",
        "            trigr = GliaNeuronTripartiteReservoirESN(\n",
        "                # sizes\n",
        "                reservoir_size=300,          # N\n",
        "                input_dim=3,\n",
        "                astro_nx=20,                 # grid width\n",
        "                astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "                rel_channels=128,            # P\n",
        "\n",
        "                # kinetics / rates\n",
        "                leak_x=0.45,                 # λ\n",
        "                rate_c=0.05,                 # α\n",
        "                rate_g=0.05,                 # ρ\n",
        "                diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "                # neuron bias\n",
        "                bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "                # nonlinearities (F, Γ)\n",
        "                c_max=1.0,                   # max Ca\n",
        "                k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "                theta_c=0.0,                 # midpoint for F\n",
        "                k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "                theta_g=0.0,                 # midpoint for Γ\n",
        "                zeta=0.0,                    # tonic drive (scalar)\n",
        "                g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "                delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "                # input map\n",
        "                input_scale=0.2,\n",
        "\n",
        "                # randomization / sparsity\n",
        "                W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "                footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "                block_scale=1.0,             # base std for random blocks\n",
        "                eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "                # spectral safety targets (row budgets, both < 1)\n",
        "                rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "                rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "                # read-out\n",
        "                ridge_alpha=1e-6,\n",
        "                use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "                feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "            )\n",
        "            trigr.fit_readout(train_input, train_target, discard=100)\n",
        "            trigr_preds = trigr.predict_open_loop(test_input)\n",
        "            trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "            nrmse_dict['TRIGR'].append(trigr_nrmse)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "9395b261",
      "metadata": {
        "id": "9395b261"
      },
      "outputs": [],
      "source": [
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'ESN':<17} {'SCR':<17} {'CRJ':<17} {'MCI-ESN':<17} {'DeepESN':<17} {'TRIGR':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    esn_vals = [np.mean(esn_nrmse[horizon]) for esn_nrmse in nrmse_dict['ESN']]\n",
        "    scr_vals = [np.mean(cycle_res_nrmse[horizon]) for cycle_res_nrmse in nrmse_dict['SCR']]\n",
        "    crj_vals = [np.mean(crj_nrmse[horizon]) for crj_nrmse in nrmse_dict['CRJ']]\n",
        "    mci_vals = [np.mean(mci_esn_nrmse[horizon]) for mci_esn_nrmse in nrmse_dict['MCI-ESN']]\n",
        "    deep_vals = [np.mean(deepesn_nrmse[horizon]) for deepesn_nrmse in nrmse_dict['DeepESN']]\n",
        "    trigr_vals = [np.mean(trigr_nrmse[horizon]) for trigr_nrmse in nrmse_dict['TRIGR']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [esn_vals, scr_vals, crj_vals, mci_vals, deep_vals, trigr_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean*10000:.4f} ± {std*10000:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "802acc7e",
      "metadata": {
        "id": "802acc7e"
      },
      "source": [
        "## Experiments on Chen Dataset under Autoregressive Forecasting"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "65de14a7",
      "metadata": {
        "id": "65de14a7"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [200, 400, 600, 800, 1000]\n",
        "initial_input = test_input[0]\n",
        "num_steps = len(test_input)\n",
        "lle_chen = 0.829\n",
        "lyapunov_time_chen = 1.0 / lle_chen\n",
        "lyapunov_time = lyapunov_time_chen\n",
        "VPT_threshold = 0.4\n",
        "test_time = np.arange(test_size)*dt\n",
        "seeds = range(1, 6)\n",
        "train_fracs = [0.7, 0.75, 0.8]\n",
        "initial_states = [[1.0, 1.0, 1.0], [1.0, 2.0, 3.0], [2.0, 1.5, 4.0]]\n",
        "tmax = 250\n",
        "dt = 0.02\n",
        "\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "VPT_dict = defaultdict(list)\n",
        "VPT_ratio_dict = defaultdict(list)\n",
        "adev_dict = defaultdict(list)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "XoZCUmq-Ksxf",
      "metadata": {
        "id": "XoZCUmq-Ksxf"
      },
      "outputs": [],
      "source": [
        "nrmse_dict['ESN'] = []\n",
        "VPT_dict['ESN'] = []\n",
        "VPT_ratio_dict['ESN'] = []\n",
        "adev_dict['ESN'] = []\n",
        "\n",
        "nrmse_dict['SCR'] = []\n",
        "VPT_dict['SCR'] = []\n",
        "VPT_ratio_dict['SCR'] = []\n",
        "adev_dict['SCR'] = []\n",
        "\n",
        "nrmse_dict['CRJ'] = []\n",
        "VPT_dict['CRJ'] = []\n",
        "VPT_ratio_dict['CRJ'] = []\n",
        "adev_dict['CRJ'] = []\n",
        "\n",
        "nrmse_dict['MCI-ESN'] = []\n",
        "VPT_dict['MCI-ESN'] = []\n",
        "VPT_ratio_dict['MCI-ESN'] = []\n",
        "adev_dict['MCI-ESN'] = []\n",
        "\n",
        "nrmse_dict['DeepESN'] = []\n",
        "VPT_dict['DeepESN'] = []\n",
        "VPT_ratio_dict['DeepESN'] = []\n",
        "adev_dict['DeepESN'] = []\n",
        "\n",
        "nrmse_dict['TRIGR'] = []\n",
        "VPT_dict['TRIGR'] = []\n",
        "VPT_ratio_dict['TRIGR'] = []\n",
        "adev_dict['TRIGR'] = []"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "c98cb9ba",
      "metadata": {
        "id": "c98cb9ba"
      },
      "outputs": [],
      "source": [
        "for initial_state in initial_states:\n",
        "    t_vals, chen_traj = generate_chen_data(\n",
        "    initial_state=initial_state,\n",
        "    tmax=tmax,\n",
        "    dt=dt\n",
        "    )\n",
        "\n",
        "    washout = 2000\n",
        "    t_vals = t_vals[washout:]\n",
        "    chen_traj = chen_traj[washout:]\n",
        "\n",
        "    scaler = MinMaxScaler()\n",
        "    scaler.fit(chen_traj)\n",
        "    chen_traj = scaler.transform(chen_traj)\n",
        "    T_data = len(chen_traj)\n",
        "\n",
        "    for train_frac in train_fracs:\n",
        "        train_end = int(train_frac * (T_data - 1))\n",
        "        train_input = chen_traj[:train_end]\n",
        "        train_target = chen_traj[1:train_end + 1]\n",
        "        test_input = chen_traj[train_end:-1]\n",
        "        test_target = chen_traj[train_end + 1:]\n",
        "        n_test_steps = len(test_input)\n",
        "        initial_in = test_input[0]\n",
        "\n",
        "        for seed in seeds:\n",
        "            # Baseline ESN\n",
        "            esn = ESN3D(\n",
        "                reservoir_size=300,\n",
        "                spectral_radius=0.92,\n",
        "                connectivity=0.3,\n",
        "                input_scale=0.8,\n",
        "                leaking_rate=0.5,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            esn.fit_readout(train_input, train_target, discard=100)\n",
        "            esn_preds = esn.predict_autoregressive(initial_input, num_steps)\n",
        "            esn_nrmse = evaluate_nrmse(esn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['ESN'].append(esn_nrmse)\n",
        "            esn_VPT, esn_VPT_ratio = compute_valid_prediction_time(test_target, esn_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['ESN'].append(esn_VPT)\n",
        "            VPT_ratio_dict['ESN'].append(esn_VPT_ratio)\n",
        "            esn_adev = compute_attractor_deviation(esn_preds, test_target)\n",
        "            adev_dict['ESN'].append(esn_adev)\n",
        "\n",
        "\n",
        "            # Cycle Reservoir\n",
        "            cycle_res = CR3D(\n",
        "                reservoir_size=300,\n",
        "                spectral_radius=0.95,\n",
        "                input_scale=0.8,\n",
        "                leaking_rate=0.3,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            cycle_res.fit_readout(train_input, train_target, discard=100)\n",
        "            cycle_res_preds = cycle_res.predict_autoregressive(initial_input, num_steps)\n",
        "            cycle_res_nrmse = evaluate_nrmse(cycle_res_preds, test_target, all_horizons)\n",
        "            nrmse_dict['SCR'].append(cycle_res_nrmse)\n",
        "            cycle_res_VPT, cycle_res_VPT_ratio = compute_valid_prediction_time(test_target, cycle_res_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['SCR'].append(cycle_res_VPT)\n",
        "            VPT_ratio_dict['SCR'].append(cycle_res_VPT_ratio)\n",
        "            cycle_res_adev = compute_attractor_deviation(cycle_res_preds, test_target)\n",
        "            adev_dict['SCR'].append(cycle_res_adev)\n",
        "\n",
        "            crj = CRJ3D(\n",
        "                reservoir_size=300,\n",
        "                jump=10,\n",
        "                spectral_radius=0.98,\n",
        "                input_scale=0.8,\n",
        "                leaking_rate=0.5,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            crj.fit_readout(train_input, train_target, discard=100)\n",
        "            crj_preds = crj.predict_autoregressive(initial_input, num_steps)\n",
        "            crj_nrmse = evaluate_nrmse(crj_preds, test_target, all_horizons)\n",
        "            nrmse_dict['CRJ'].append(crj_nrmse)\n",
        "            crj_VPT, crj_VPT_ratio = compute_valid_prediction_time(test_target, crj_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['CRJ'].append(crj_VPT)\n",
        "            VPT_ratio_dict['CRJ'].append(crj_VPT_ratio)\n",
        "            crj_adev = compute_attractor_deviation(crj_preds, test_target)\n",
        "            adev_dict['CRJ'].append(crj_adev)\n",
        "\n",
        "            mci_esn = MCI3D(\n",
        "                reservoir_size=300,\n",
        "                cycle_weight=0.8,\n",
        "                connect_weight=1,\n",
        "                combine_factor=0.6,\n",
        "                input_scale=0.5,\n",
        "                leaking_rate=0.7,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            mci_esn.fit_readout(train_input, train_target, discard=100)\n",
        "            mci_esn_preds = mci_esn.predict_autoregressive(initial_input, num_steps)\n",
        "            mci_esn_nrmse = evaluate_nrmse(mci_esn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['MCI-ESN'].append(mci_esn_nrmse)\n",
        "            mci_esn_VPT, mci_esn_VPT_ratio = compute_valid_prediction_time(test_target, mci_esn_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['MCI-ESN'].append(mci_esn_VPT)\n",
        "            VPT_ratio_dict['MCI-ESN'].append(mci_esn_VPT_ratio)\n",
        "            mci_esn_adev = compute_attractor_deviation(mci_esn_preds, test_target)\n",
        "            adev_dict['MCI-ESN'].append(mci_esn_adev)\n",
        "\n",
        "            deepesn = DeepESN3D(\n",
        "                num_layers=3,\n",
        "                reservoir_size=100,\n",
        "                spectral_radius=0.95,\n",
        "                connectivity=0.01,\n",
        "                input_scale=0.2,\n",
        "                leaking_rate=0.9,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            deepesn.fit_readout(train_input, train_target, discard=100)\n",
        "            deepesn_preds = deepesn.predict_autoregressive(initial_input, num_steps)\n",
        "            deepesn_nrmse = evaluate_nrmse(deepesn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['DeepESN'].append(deepesn_nrmse)\n",
        "            deepesn_VPT, deepesn_VPT_ratio = compute_valid_prediction_time(test_target, deepesn_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['DeepESN'].append(deepesn_VPT)\n",
        "            VPT_ratio_dict['DeepESN'].append(deepesn_VPT_ratio)\n",
        "            deepesn_adev = compute_attractor_deviation(deepesn_preds, test_target)\n",
        "            adev_dict['DeepESN'].append(deepesn_adev)\n",
        "\n",
        "            trigr = GliaNeuronTripartiteReservoirESN(\n",
        "                    reservoir_size=300,\n",
        "                    n_astrocytes = 20,\n",
        "                    input_dim=3,\n",
        "                    rho_star=0.95,\n",
        "                    alpha=0.65,\n",
        "                    tau_c=200,\n",
        "                    eta=0.9,\n",
        "                    D_diff=0.15,\n",
        "                    theta=0.3,\n",
        "                    gamma_glia=0.05,\n",
        "                    input_scale=0.5,\n",
        "                    ridge_alpha=1e-6,\n",
        "                    seed=seed\n",
        "                )\n",
        "            trigr.fit_readout(train_input, train_target, discard=100)\n",
        "            trigr_preds = trigr.predict_autoregressive(initial_input, num_steps)\n",
        "            trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "            nrmse_dict['TRIGR'].append(trigr_nrmse)\n",
        "            trigr_VPT, trigr_VPT_ratio = compute_valid_prediction_time(test_target, trigr_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['TRIGR'].append(trigr_VPT)\n",
        "            VPT_ratio_dict['TRIGR'].append(trigr_VPT_ratio)\n",
        "            trigr_adev = compute_attractor_deviation(trigr_preds, test_target)\n",
        "            adev_dict['TRIGR'].append(trigr_adev)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "02b9a386",
      "metadata": {},
      "outputs": [],
      "source": [
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'ESN':<17} {'SCR':<17} {'CRJ':<17} {'MCI-ESN':<17} {'DeepESN':<17} {'TRIGR':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    esn_vals = [np.mean(esn_nrmse[horizon]) for esn_nrmse in nrmse_dict['ESN']]\n",
        "    scr_vals = [np.mean(cycle_res_nrmse[horizon]) for cycle_res_nrmse in nrmse_dict['SCR']]\n",
        "    crj_vals = [np.mean(crj_nrmse[horizon]) for crj_nrmse in nrmse_dict['CRJ']]\n",
        "    mci_vals = [np.mean(mci_esn_nrmse[horizon]) for mci_esn_nrmse in nrmse_dict['MCI-ESN']]\n",
        "    deep_vals = [np.mean(deepesn_nrmse[horizon]) for deepesn_nrmse in nrmse_dict['DeepESN']]\n",
        "    trigr_vals = [np.mean(trigr_nrmse[horizon]) for trigr_nrmse in nrmse_dict['TRIGR']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [esn_vals, scr_vals, crj_vals, mci_vals, deep_vals, trigr_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "c2e1150e",
      "metadata": {},
      "outputs": [],
      "source": [
        "plot_len = 1000\n",
        "steps = list(range(10, plot_len + 1, 10))\n",
        "marker_steps = [10, 200, 400, 600, 800, 1000]\n",
        "\n",
        "models = {\n",
        "    'ESN': esn_nrmse,\n",
        "    'SCR': cycle_res_nrmse,\n",
        "    'CRJ': crj_nrmse,\n",
        "    'MCI-ESN': mci_esn_nrmse,\n",
        "    'DeepESN': deepesn_nrmse,\n",
        "    'TRIGR': trigr_nrmse\n",
        "}\n",
        "\n",
        "# Assign a unique marker and color style for each\n",
        "colors = plt.cm.tab10.colors\n",
        "markers = ['o', 's', 'D', '^', 'v', 'P', 'X']\n",
        "\n",
        "plt.figure(figsize=(5, 6))\n",
        "\n",
        "for i, (name, data) in enumerate(models.items()):\n",
        "    values = [np.mean(data[s]) for s in steps]\n",
        "    color = colors[i % len(colors)]\n",
        "    marker = markers[i % len(markers)]\n",
        "    values = []\n",
        "\n",
        "    for horizon in all_horizons:\n",
        "        # Get all NRMSE values across all runs for this model and this horizon\n",
        "        all_vals = []\n",
        "        for run in nrmse_dict[name]:\n",
        "            all_vals.extend([np.mean(run[horizon])])\n",
        "        values.append(np.mean(all_vals))\n",
        "\n",
        "    # Plot with markers so legend also shows them\n",
        "    plt.plot(steps, values, label=name, linewidth=2.2, color=color,\n",
        "             marker=marker, markevery=[steps.index(s) for s in marker_steps if s in steps],\n",
        "             markersize=7)\n",
        "\n",
        "# Labels and title\n",
        "plt.xlabel('Prediction Horizon', fontsize=12)\n",
        "plt.ylabel('NRMSE', fontsize=12)\n",
        "# plt.title('NRMSE vs. Prediction Horizon (Autoregressive Forecasting)', fontsize=14, fontweight='bold')\n",
        "plt.grid(True, linestyle='--', linewidth=0.6, alpha=0.6)\n",
        "plt.legend(fontsize=9, ncol=2, loc='upper left')\n",
        "plt.tight_layout()\n",
        "plt.savefig(\"Figures/NRMSE_vs_Prediction_Horizon_AR_Chen.png\", dpi=400, bbox_inches='tight')\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "758420f4",
      "metadata": {},
      "outputs": [],
      "source": [
        "import matplotlib.pyplot as plt\n",
        "import seaborn as sns\n",
        "import pandas as pd\n",
        "\n",
        "target_horizon = 1000\n",
        "\n",
        "records = []\n",
        "for model_name in ['ESN', 'SCR', 'CRJ', 'MCI-ESN', 'DeepESN', 'TRIGR']:\n",
        "    model_vals = [np.mean(entry[target_horizon]) for entry in nrmse_dict[model_name]]\n",
        "    for val in model_vals:\n",
        "        records.append({\n",
        "            \"Model\": model_name,\n",
        "            \"NRMSE\": val\n",
        "        })\n",
        "\n",
        "df = pd.DataFrame(records)\n",
        "\n",
        "# ─── PLOTTING ──────────────────────────────────────────────────────────────\n",
        "sns.set(style=\"whitegrid\")\n",
        "plt.figure(figsize=(6, 6))\n",
        "\n",
        "sns.boxplot(data=df, x='Model', y='Value', palette='Set2', showfliers=False)\n",
        "# plt.title(f'Boxplot of NRMSE at Horizon {target_horizon}')\n",
        "plt.ylabel('NRMSE')\n",
        "plt.xticks(rotation=45)\n",
        "plt.grid(True, linestyle='--', alpha=0.5)\n",
        "plt.tight_layout()\n",
        "plt.savefig(f\"BoxPlot_NRMSE_H{target_horizon}_Chen-trigr.png\", dpi=400)\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "637f62a9",
      "metadata": {},
      "outputs": [],
      "source": [
        "print(f\"{'':<20} {'ESN':<20} {'SCR':<20} {'CRJ':<20} {'MCI-ESN':<20} {'DeepESN':<20} {'TRIGR':<20}\")\n",
        "print(\"-\" * 160)\n",
        "\n",
        "print(f\"{'T_VPT':<20}\", end='')\n",
        "for model in ['ESN', 'SCR', 'CRJ', 'MCI-ESN', 'DeepESN', 'TRIGR']:\n",
        "    mean = np.mean(VPT_dict[model])\n",
        "    std = np.std(VPT_dict[model])\n",
        "    print(f\"{mean:.3f} ± {std:.2f}\".ljust(20), end='')\n",
        "print()\n",
        "\n",
        "print(f\"{'T_VPT/T_lambda':<20}\", end='')\n",
        "for model in ['ESN', 'SCR', 'CRJ', 'MCI-ESN', 'DeepESN', 'TRIGR']:\n",
        "    mean = np.mean(VPT_ratio_dict[model])\n",
        "    std = np.std(VPT_ratio_dict[model])\n",
        "    print(f\"{mean:.3f} ± {std:.2f}\".ljust(20), end='')\n",
        "print()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "777f28ae",
      "metadata": {},
      "outputs": [],
      "source": [
        "print(f\"{'':<20} {'ESN':<20} {'SCR':<20} {'CRJ':<20} {'MCI-ESN':<20} {'DeepESN':<20} {'TRIGR':<20}\")\n",
        "print(\"-\" * 160)\n",
        "\n",
        "print(f\"{'ADev':<20}\", end='')\n",
        "for model in ['ESN', 'SCR', 'CRJ', 'MCI-ESN', 'DeepESN', 'TRIGR']:\n",
        "    values = adev_dict[model]\n",
        "    mean = np.mean(values)\n",
        "    mad = np.mean(np.abs(values - mean))\n",
        "    print(f\"{mean:.2f} ± {mad:.2f}\".ljust(20), end='')\n",
        "print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "a2b6764a",
      "metadata": {
        "id": "a2b6764a"
      },
      "source": [
        "## Experiments on Chen Dataset in Teacher-Forced Setting"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "0698254d",
      "metadata": {
        "id": "0698254d"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [200, 400, 600, 800, 1000]\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "seeds = range(1, 6)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "E1CmBX1bMzDU",
      "metadata": {
        "id": "E1CmBX1bMzDU"
      },
      "outputs": [],
      "source": [
        "nrmse_dict['ESN'] = []\n",
        "nrmse_dict['SCR'] = []\n",
        "nrmse_dict['CRJ'] = []\n",
        "nrmse_dict['MCI-ESN'] = []\n",
        "nrmse_dict['DeepESN'] = []\n",
        "nrmse_dict['TRIGR'] = []"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "bf768f9b",
      "metadata": {
        "id": "bf768f9b"
      },
      "outputs": [],
      "source": [
        "for initial_state in initial_states:\n",
        "    t_vals, chen_traj = generate_chen_data(\n",
        "    initial_state=initial_state,\n",
        "    tmax=tmax,\n",
        "    dt=dt\n",
        "    )\n",
        "\n",
        "    washout = 2000\n",
        "    t_vals = t_vals[washout:]\n",
        "    chen_traj = chen_traj[washout:]\n",
        "\n",
        "    scaler = MinMaxScaler()\n",
        "    scaler.fit(chen_traj)\n",
        "    chen_traj = scaler.transform(chen_traj)\n",
        "    T_data = len(chen_traj)\n",
        "\n",
        "    for train_frac in train_fracs:\n",
        "        train_end = int(train_frac * (T_data - 1))\n",
        "        train_input = chen_traj[:train_end]\n",
        "        train_target = chen_traj[1:train_end + 1]\n",
        "        test_input = chen_traj[train_end:-1]\n",
        "        test_target = chen_traj[train_end + 1:]\n",
        "        n_test_steps = len(test_input)\n",
        "        initial_in = test_input[0]\n",
        "\n",
        "        for seed in seeds:\n",
        "            # Baseline ESN\n",
        "            esn = ESN3D(\n",
        "                reservoir_size=300,\n",
        "                spectral_radius=0.92,\n",
        "                connectivity=0.3,\n",
        "                input_scale=0.8,\n",
        "                leaking_rate=0.5,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            esn.fit_readout(train_input, train_target, discard=100)\n",
        "            esn_preds = esn.predict_autoregressive(initial_input, num_steps)\n",
        "            esn_nrmse = evaluate_nrmse(esn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['ESN'].append(esn_nrmse)\n",
        "\n",
        "            # Cycle Reservoir\n",
        "            cycle_res = CR3D(\n",
        "                reservoir_size=300,\n",
        "                spectral_radius=0.95,\n",
        "                input_scale=0.8,\n",
        "                leaking_rate=0.3,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            cycle_res.fit_readout(train_input, train_target, discard=100)\n",
        "            cycle_res_preds = cycle_res.predict_autoregressive(initial_input, num_steps)\n",
        "            cycle_res_nrmse = evaluate_nrmse(cycle_res_preds, test_target, all_horizons)\n",
        "            nrmse_dict['SCR'].append(cycle_res_nrmse)\n",
        "\n",
        "            crj = CRJ3D(\n",
        "                reservoir_size=300,\n",
        "                jump=10,\n",
        "                spectral_radius=0.98,\n",
        "                input_scale=0.8,\n",
        "                leaking_rate=0.5,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            crj.fit_readout(train_input, train_target, discard=100)\n",
        "            crj_preds = crj.predict_autoregressive(initial_input, num_steps)\n",
        "            crj_nrmse = evaluate_nrmse(crj_preds, test_target, all_horizons)\n",
        "            nrmse_dict['CRJ'].append(crj_nrmse)\n",
        "\n",
        "            mci_esn = MCI3D(\n",
        "                reservoir_size=300,\n",
        "                cycle_weight=0.8,\n",
        "                connect_weight=1,\n",
        "                combine_factor=0.6,\n",
        "                input_scale=0.5,\n",
        "                leaking_rate=0.7,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            mci_esn.fit_readout(train_input, train_target, discard=100)\n",
        "            mci_esn_preds = mci_esn.predict_autoregressive(initial_input, num_steps)\n",
        "            mci_esn_nrmse = evaluate_nrmse(mci_esn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['MCI-ESN'].append(mci_esn_nrmse)\n",
        "\n",
        "            deepesn = DeepESN3D(\n",
        "                num_layers=3,\n",
        "                reservoir_size=100,\n",
        "                spectral_radius=0.95,\n",
        "                connectivity=0.01,\n",
        "                input_scale=0.2,\n",
        "                leaking_rate=0.9,\n",
        "                ridge_alpha=1e-6,\n",
        "                seed=seed\n",
        "            )\n",
        "            deepesn.fit_readout(train_input, train_target, discard=100)\n",
        "            deepesn_preds = deepesn.predict_autoregressive(initial_input, num_steps)\n",
        "            deepesn_nrmse = evaluate_nrmse(deepesn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['DeepESN'].append(deepesn_nrmse)\n",
        "\n",
        "            trigr = GliaNeuronTripartiteReservoirESN(\n",
        "                # sizes\n",
        "                reservoir_size=300,          # N\n",
        "                input_dim=3,\n",
        "                astro_nx=20,                 # grid width\n",
        "                astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "                rel_channels=128,            # P\n",
        "\n",
        "                # kinetics / rates\n",
        "                leak_x=0.45,                 # λ\n",
        "                rate_c=0.05,                 # α\n",
        "                rate_g=0.05,                 # ρ\n",
        "                diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "                # neuron bias\n",
        "                bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "                # nonlinearities (F, Γ)\n",
        "                c_max=1.0,                   # max Ca\n",
        "                k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "                theta_c=0.0,                 # midpoint for F\n",
        "                k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "                theta_g=0.0,                 # midpoint for Γ\n",
        "                zeta=0.0,                    # tonic drive (scalar)\n",
        "                g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "                delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "                # input map\n",
        "                input_scale=0.2,\n",
        "\n",
        "                # randomization / sparsity\n",
        "                W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "                footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "                block_scale=1.0,             # base std for random blocks\n",
        "                eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "                # spectral safety targets (row budgets, both < 1)\n",
        "                rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "                rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "                # read-out\n",
        "                ridge_alpha=1e-6,\n",
        "                use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "                feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "            )\n",
        "            trigr.fit_readout(train_input, train_target, discard=100)\n",
        "            trigr_preds = trigr.predict_autoregressive(initial_input, num_steps)\n",
        "            trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "            nrmse_dict['TRIGR'].append(trigr_nrmse)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "7d772bfe",
      "metadata": {
        "id": "7d772bfe"
      },
      "outputs": [],
      "source": [
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'ESN':<17} {'SCR':<17} {'CRJ':<17} {'MCI-ESN':<17} {'DeepESN':<17} {'TRIGR':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    esn_vals = [np.mean(esn_nrmse[horizon]) for esn_nrmse in nrmse_dict['ESN']]\n",
        "    scr_vals = [np.mean(cycle_res_nrmse[horizon]) for cycle_res_nrmse in nrmse_dict['SCR']]\n",
        "    crj_vals = [np.mean(crj_nrmse[horizon]) for crj_nrmse in nrmse_dict['CRJ']]\n",
        "    mci_vals = [np.mean(mci_esn_nrmse[horizon]) for mci_esn_nrmse in nrmse_dict['MCI-ESN']]\n",
        "    deep_vals = [np.mean(deepesn_nrmse[horizon]) for deepesn_nrmse in nrmse_dict['DeepESN']]\n",
        "    trigr_vals = [np.mean(trigr_nrmse[horizon]) for trigr_nrmse in nrmse_dict['TRIGR']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [esn_vals, scr_vals, crj_vals, mci_vals, deep_vals, trigr_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean*10000:.4f} ± {std*10000:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "a54c9196",
      "metadata": {
        "id": "a54c9196"
      },
      "outputs": [],
      "source": [
        "import matplotlib.pyplot as plt\n",
        "import numpy as np\n",
        "\n",
        "plot_len = 1000\n",
        "steps = list(range(10, plot_len + 1, 10))\n",
        "marker_steps = [10, 200, 400, 600, 800, 1000]\n",
        "\n",
        "models = {\n",
        "    'ESN': esn_nrmse,\n",
        "    'SCR': cycle_res_nrmse,\n",
        "    'CRJ': crj_nrmse,\n",
        "    'MCI-ESN': mci_esn_nrmse,\n",
        "    'DeepESN': deepesn_nrmse,\n",
        "    'TRIGR': trigr_nrmse\n",
        "}\n",
        "\n",
        "# Assign a unique marker and color style for each\n",
        "colors = plt.cm.tab10.colors\n",
        "markers = ['o', 's', 'D', '^', 'v', 'P', 'X']\n",
        "\n",
        "plt.figure(figsize=(5, 6))\n",
        "\n",
        "for i, (name, data) in enumerate(models.items()):\n",
        "    values = [np.mean(data[s]) for s in steps]\n",
        "    color = colors[i % len(colors)]\n",
        "    marker = markers[i % len(markers)]\n",
        "    values = []\n",
        "\n",
        "    for horizon in all_horizons:\n",
        "        # Get all NRMSE values across all runs for this model and this horizon\n",
        "        all_vals = []\n",
        "        for run in nrmse_dict[name]:\n",
        "            all_vals.extend([np.mean(run[horizon])])\n",
        "        values.append(np.mean(all_vals))\n",
        "\n",
        "    # Plot with markers so legend also shows them\n",
        "    plt.plot(steps, values, label=name, linewidth=2.2, color=color,\n",
        "             marker=marker, markevery=[steps.index(s) for s in marker_steps if s in steps],\n",
        "             markersize=7)\n",
        "\n",
        "# Labels and title\n",
        "plt.xlabel('Prediction Horizon', fontsize=12)\n",
        "plt.ylabel('NRMSE', fontsize=12)\n",
        "# plt.title('NRMSE vs. Prediction Horizon (Autoregressive Forecasting)', fontsize=14, fontweight='bold')\n",
        "plt.grid(True, linestyle='--', linewidth=0.6, alpha=0.6)\n",
        "plt.legend(fontsize=9, ncol=2, loc='upper left')\n",
        "plt.tight_layout()\n",
        "plt.savefig(\"Figures/NRMSE_vs_Prediction_Horizon_TF_Chen.png\", dpi=400, bbox_inches='tight')\n",
        "plt.show()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "ad1d603e",
      "metadata": {
        "id": "ad1d603e"
      },
      "source": [
        "## Ablation over Reservoir Dynamics"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "d2aee0f4",
      "metadata": {
        "id": "d2aee0f4"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [200, 400, 600, 800, 1000]\n",
        "initial_input = test_input[0]\n",
        "num_steps = len(test_input)\n",
        "lle_lorenz = 0.9\n",
        "lyapunov_time_lorenz = 1.0 / lle_lorenz\n",
        "lyapunov_time = lyapunov_time_lorenz\n",
        "VPT_threshold = 0.4\n",
        "test_time = np.arange(test_size)*dt\n",
        "seeds = range(1, 6)\n",
        "train_fracs = [0.7,0.75,0.8]\n",
        "initial_states = [[1.0, 1.0, 1.0], [1.0, 2.0, 3.0], [2.0, 1.5, 4.0]]\n",
        "tmax = 250\n",
        "dt = 0.02\n",
        "\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "VPT_dict = defaultdict(list)\n",
        "VPT_ratio_dict = defaultdict(list)\n",
        "adev_dict = defaultdict(list)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "7d6705af",
      "metadata": {
        "id": "7d6705af"
      },
      "outputs": [],
      "source": [
        "for initial_state in initial_states:\n",
        "    t_vals, lorenz_traj = generate_lorenz_data(\n",
        "    initial_state=initial_state,\n",
        "    tmax=tmax,\n",
        "    dt=dt\n",
        "    )\n",
        "\n",
        "    washout = 2000\n",
        "    t_vals = t_vals[washout:]\n",
        "    lorenz_traj = lorenz_traj[washout:]\n",
        "\n",
        "    scaler = MinMaxScaler()\n",
        "    scaler.fit(lorenz_traj)\n",
        "    lorenz_traj = scaler.transform(lorenz_traj)\n",
        "    T_data = len(lorenz_traj)\n",
        "\n",
        "    for train_frac in train_fracs:\n",
        "        train_end = int(train_frac * (T_data - 1))\n",
        "        train_input = lorenz_traj[:train_end]\n",
        "        train_target = lorenz_traj[1:train_end + 1]\n",
        "        test_input = lorenz_traj[train_end:-1]\n",
        "        test_target = lorenz_traj[train_end + 1:]\n",
        "        n_test_steps = len(test_input)\n",
        "        initial_in = test_input[0]\n",
        "\n",
        "        for seed in seeds:\n",
        "            trigr = GliaNeuronTripartiteReservoirESN(\n",
        "                # sizes\n",
        "                reservoir_size=300,          # N\n",
        "                input_dim=3,\n",
        "                astro_nx=20,                 # grid width\n",
        "                astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "                rel_channels=128,            # P\n",
        "\n",
        "                # kinetics / rates\n",
        "                leak_x=0.45,                 # λ\n",
        "                rate_c=0.05,                 # α\n",
        "                rate_g=0.05,                 # ρ\n",
        "                diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "                # neuron bias\n",
        "                bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "                # nonlinearities (F, Γ)\n",
        "                c_max=1.0,                   # max Ca\n",
        "                k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "                theta_c=0.0,                 # midpoint for F\n",
        "                k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "                theta_g=0.0,                 # midpoint for Γ\n",
        "                zeta=0.0,                    # tonic drive (scalar)\n",
        "                g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "                delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "                # input map\n",
        "                input_scale=0.2,\n",
        "\n",
        "                # randomization / sparsity\n",
        "                W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "                footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "                block_scale=1.0,             # base std for random blocks\n",
        "                eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "                # spectral safety targets (row budgets, both < 1)\n",
        "                rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "                rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "                # read-out\n",
        "                ridge_alpha=1e-6,\n",
        "                use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "                feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "            )\n",
        "            trigr.fit_readout(train_input, train_target, discard=100)\n",
        "            trigr_preds = trigr.predict_autoregressive(initial_input, num_steps)\n",
        "            trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "            nrmse_dict['Full'].append(trigr_nrmse)\n",
        "            trigr_VPT, trigr_VPT_ratio = compute_valid_prediction_time(test_target, trigr_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['Full'].append(trigr_VPT)\n",
        "            VPT_ratio_dict['Full'].append(trigr_VPT_ratio)\n",
        "            trigr_adev = compute_attractor_deviation(trigr_preds, test_target)\n",
        "            adev_dict['Full'].append(trigr_adev)\n",
        "\n",
        "\n",
        "            trigr = GliaNeuronTripartiteReservoirESN(\n",
        "                # sizes\n",
        "                reservoir_size=300,          # N\n",
        "                input_dim=3,\n",
        "                astro_nx=20,                 # grid width\n",
        "                astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "                rel_channels=128,            # P\n",
        "\n",
        "                # kinetics / rates\n",
        "                leak_x=0.45,                 # λ\n",
        "                rate_c=0.05,                 # α\n",
        "                rate_g=0.05,                 # ρ\n",
        "                diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "                # neuron bias\n",
        "                bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "                # nonlinearities (F, Γ)\n",
        "                c_max=1.0,                   # max Ca\n",
        "                k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "                theta_c=0.0,                 # midpoint for F\n",
        "                k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "                theta_g=0.0,                 # midpoint for Γ\n",
        "                zeta=0.0,                    # tonic drive (scalar)\n",
        "                g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "                delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "                # input map\n",
        "                input_scale=0.2,\n",
        "\n",
        "                # randomization / sparsity\n",
        "                W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "                footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "                block_scale=1.0,             # base std for random blocks\n",
        "                eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "                # spectral safety targets (row budgets, both < 1)\n",
        "                rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "                rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "                # read-out\n",
        "                ridge_alpha=1e-6,\n",
        "                use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "                feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "            )\n",
        "            trigr.fit_readout(train_input, train_target, discard=100)\n",
        "            trigr_preds = trigr.predict_autoregressive(initial_input, num_steps)\n",
        "            trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "            nrmse_dict['QL'].append(trigr_nrmse)\n",
        "            trigr_VPT, trigr_VPT_ratio = compute_valid_prediction_time(test_target, trigr_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['QL'].append(trigr_VPT)\n",
        "            VPT_ratio_dict['QL'].append(trigr_VPT_ratio)\n",
        "            trigr_adev = compute_attractor_deviation(trigr_preds, test_target)\n",
        "            adev_dict['QL'].append(trigr_adev)\n",
        "\n",
        "\n",
        "            trigr = GliaNeuronTripartiteReservoirESN(\n",
        "                # sizes\n",
        "                reservoir_size=300,          # N\n",
        "                input_dim=3,\n",
        "                astro_nx=20,                 # grid width\n",
        "                astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "                rel_channels=128,            # P\n",
        "\n",
        "                # kinetics / rates\n",
        "                leak_x=0.45,                 # λ\n",
        "                rate_c=0.05,                 # α\n",
        "                rate_g=0.05,                 # ρ\n",
        "                diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "                # neuron bias\n",
        "                bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "                # nonlinearities (F, Γ)\n",
        "                c_max=1.0,                   # max Ca\n",
        "                k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "                theta_c=0.0,                 # midpoint for F\n",
        "                k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "                theta_g=0.0,                 # midpoint for Γ\n",
        "                zeta=0.0,                    # tonic drive (scalar)\n",
        "                g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "                delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "                # input map\n",
        "                input_scale=0.2,\n",
        "\n",
        "                # randomization / sparsity\n",
        "                W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "                footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "                block_scale=1.0,             # base std for random blocks\n",
        "                eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "                # spectral safety targets (row budgets, both < 1)\n",
        "                rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "                rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "                # read-out\n",
        "                ridge_alpha=1e-6,\n",
        "                use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "                feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "            )\n",
        "            trigr.fit_readout(train_input, train_target, discard=100)\n",
        "            trigr_preds = trigr.predict_autoregressive(initial_input, num_steps)\n",
        "            trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "            nrmse_dict['AF'].append(trigr_nrmse)\n",
        "            trigr_VPT, trigr_VPT_ratio = compute_valid_prediction_time(test_target, trigr_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['AF'].append(trigr_VPT)\n",
        "            VPT_ratio_dict['AF'].append(trigr_VPT_ratio)\n",
        "            trigr_adev = compute_attractor_deviation(trigr_preds, test_target)\n",
        "            adev_dict['AF'].append(trigr_adev)\n",
        "\n",
        "            trigr = GliaNeuronTripartiteReservoirESN(\n",
        "                # sizes\n",
        "                reservoir_size=300,          # N\n",
        "                input_dim=3,\n",
        "                astro_nx=20,                 # grid width\n",
        "                astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "                rel_channels=128,            # P\n",
        "\n",
        "                # kinetics / rates\n",
        "                leak_x=0.45,                 # λ\n",
        "                rate_c=0.05,                 # α\n",
        "                rate_g=0.05,                 # ρ\n",
        "                diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "                # neuron bias\n",
        "                bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "                # nonlinearities (F, Γ)\n",
        "                c_max=1.0,                   # max Ca\n",
        "                k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "                theta_c=0.0,                 # midpoint for F\n",
        "                k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "                theta_g=0.0,                 # midpoint for Γ\n",
        "                zeta=0.0,                    # tonic drive (scalar)\n",
        "                g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "                delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "                # input map\n",
        "                input_scale=0.2,\n",
        "\n",
        "                # randomization / sparsity\n",
        "                W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "                footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "                block_scale=1.0,             # base std for random blocks\n",
        "                eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "                # spectral safety targets (row budgets, both < 1)\n",
        "                rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "                rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "                # read-out\n",
        "                ridge_alpha=1e-6,\n",
        "                use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "                feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "            )\n",
        "            trigr.fit_readout(train_input, train_target, discard=100)\n",
        "            trigr_preds = trigr.predict_autoregressive(initial_input, num_steps)\n",
        "            trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "            nrmse_dict['CF'].append(trigr_nrmse)\n",
        "            trigr_VPT, trigr_VPT_ratio = compute_valid_prediction_time(test_target, trigr_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['CF'].append(trigr_VPT)\n",
        "            VPT_ratio_dict['CF'].append(trigr_VPT_ratio)\n",
        "            trigr_adev = compute_attractor_deviation(trigr_preds, test_target)\n",
        "            adev_dict['CF'].append(trigr_adev)\n",
        "\n",
        "            trigr = GliaNeuronTripartiteReservoirESN(\n",
        "                # sizes\n",
        "                reservoir_size=300,          # N\n",
        "                input_dim=3,\n",
        "                astro_nx=20,                 # grid width\n",
        "                astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "                rel_channels=128,            # P\n",
        "\n",
        "                # kinetics / rates\n",
        "                leak_x=0.45,                 # λ\n",
        "                rate_c=0.05,                 # α\n",
        "                rate_g=0.05,                 # ρ\n",
        "                diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "                # neuron bias\n",
        "                bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "                # nonlinearities (F, Γ)\n",
        "                c_max=1.0,                   # max Ca\n",
        "                k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "                theta_c=0.0,                 # midpoint for F\n",
        "                k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "                theta_g=0.0,                 # midpoint for Γ\n",
        "                zeta=0.0,                    # tonic drive (scalar)\n",
        "                g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "                delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "                # input map\n",
        "                input_scale=0.2,\n",
        "\n",
        "                # randomization / sparsity\n",
        "                W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "                footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "                block_scale=1.0,             # base std for random blocks\n",
        "                eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "                # spectral safety targets (row budgets, both < 1)\n",
        "                rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "                rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "                # read-out\n",
        "                ridge_alpha=1e-6,\n",
        "                use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "                feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "            )\n",
        "            trigr.fit_readout(train_input, train_target, discard=100)\n",
        "            trigr_preds = trigr.predict_autoregressive(initial_input, num_steps)\n",
        "            trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "            nrmse_dict['STS'].append(trigr_nrmse)\n",
        "            trigr_VPT, trigr_VPT_ratio = compute_valid_prediction_time(test_target, trigr_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['STS'].append(trigr_VPT)\n",
        "            VPT_ratio_dict['STS'].append(trigr_VPT_ratio)\n",
        "            trigr_adev = compute_attractor_deviation(trigr_preds, test_target)\n",
        "            adev_dict['STS'].append(trigr_adev)\n",
        "\n",
        "\n",
        "            trigr = GliaNeuronTripartiteReservoirESN(\n",
        "                # sizes\n",
        "                reservoir_size=300,          # N\n",
        "                input_dim=3,\n",
        "                astro_nx=20,                 # grid width\n",
        "                astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "                rel_channels=128,            # P\n",
        "\n",
        "                # kinetics / rates\n",
        "                leak_x=0.45,                 # λ\n",
        "                rate_c=0.05,                 # α\n",
        "                rate_g=0.05,                 # ρ\n",
        "                diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "                # neuron bias\n",
        "                bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "                # nonlinearities (F, Γ)\n",
        "                c_max=1.0,                   # max Ca\n",
        "                k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "                theta_c=0.0,                 # midpoint for F\n",
        "                k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "                theta_g=0.0,                 # midpoint for Γ\n",
        "                zeta=0.0,                    # tonic drive (scalar)\n",
        "                g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "                delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "                # input map\n",
        "                input_scale=0.2,\n",
        "\n",
        "                # randomization / sparsity\n",
        "                W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "                footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "                block_scale=1.0,             # base std for random blocks\n",
        "                eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "                # spectral safety targets (row budgets, both < 1)\n",
        "                rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "                rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "                # read-out\n",
        "                ridge_alpha=1e-6,\n",
        "                use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "                feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "            )\n",
        "            trigr.fit_readout(train_input, train_target, discard=100)\n",
        "            trigr_preds = trigr.predict_autoregressive(initial_input, num_steps)\n",
        "            trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "            nrmse_dict['NCR'].append(trigr_nrmse)\n",
        "            trigr_VPT, trigr_VPT_ratio = compute_valid_prediction_time(test_target, trigr_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['NCR'].append(trigr_VPT)\n",
        "            VPT_ratio_dict['NCR'].append(trigr_VPT_ratio)\n",
        "            trigr_adev = compute_attractor_deviation(trigr_preds, test_target)\n",
        "            adev_dict['NCR'].append(trigr_adev)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "ce22412c",
      "metadata": {
        "id": "ce22412c"
      },
      "outputs": [],
      "source": [
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'Full':<17} {'QL':<17} {'AF':<17} {'CF':<17} {'STS':<17} {'NCR':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    vals1 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict['Full']]\n",
        "    vals2 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict['QL']]\n",
        "    vals3 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict['AF']]\n",
        "    vals4 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict['CF']]\n",
        "    vals5 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict['STS']]\n",
        "    vals6 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict['NCR']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [vals1, vals2, vals3, vals4, vals5,vals6]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()\n",
        "\n",
        "print()\n",
        "\n",
        "print(f\"{'':<20}{'Full':<20} {'QL':<20} {'AF':<20} {'CF':<20} {'STS':<20} {'NCR':<20}\")\n",
        "print(\"-\" * 160)\n",
        "\n",
        "print(f\"{'T_VPT':<20}\", end='')\n",
        "for model in ['Full','QL','AF','CF','STS','NCR']:\n",
        "    mean = np.mean(VPT_dict[model])\n",
        "    std = np.std(VPT_dict[model])\n",
        "    print(f\"{mean:.3f} ± {std:.2f}\".ljust(20), end='')\n",
        "print()\n",
        "\n",
        "print(f\"{'T_VPT/T_lambda':<20}\", end='')\n",
        "for model in ['Full','QL','AF','CF','STS','NCR']:\n",
        "    mean = np.mean(VPT_ratio_dict[model])\n",
        "    std = np.std(VPT_ratio_dict[model])\n",
        "    print(f\"{mean:.3f} ± {std:.2f}\".ljust(20), end='')\n",
        "print()\n",
        "print()\n",
        "\n",
        "print(f\"{'':<20}{'Full':<20} {'QL':<20} {'AF':<20} {'CF':<20} {'STS':<20} {'NCR':<20}\")\n",
        "print(\"-\" * 160)\n",
        "\n",
        "print(f\"{'SDQ':<20}\", end='')\n",
        "for model in ['Full','QL','AF','CF','STS','NCR']:\n",
        "    values = adev_dict[model]\n",
        "    mean = np.mean(values)\n",
        "    mad = np.mean(np.abs(values - mean))\n",
        "    print(f\"{mean:.2f} ± {mad:.2f}\".ljust(20), end='')\n",
        "print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "7a8dd613",
      "metadata": {
        "id": "7a8dd613"
      },
      "source": [
        "## Ablation over Spectral Radius"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "2c5fb8ef",
      "metadata": {
        "id": "2c5fb8ef"
      },
      "outputs": [],
      "source": [
        "for rho_star in [0.7, 0.9, 0.92, 0.99, 1.05]:\n",
        "    nrmse_dict[rho_star] = []\n",
        "    VPT_dict[rho_star] = []\n",
        "    VPT_ratio_dict[rho_star] = []\n",
        "    adev_dict[rho_star] = []\n",
        "    for initial_state in initial_states:\n",
        "        t_vals, lorenz_traj = generate_lorenz_data(\n",
        "        initial_state=initial_state,\n",
        "        tmax=tmax,\n",
        "        dt=dt\n",
        "        )\n",
        "\n",
        "        washout = 2000\n",
        "        t_vals = t_vals[washout:]\n",
        "        lorenz_traj = lorenz_traj[washout:]\n",
        "\n",
        "        scaler = MinMaxScaler()\n",
        "        scaler.fit(lorenz_traj)\n",
        "        lorenz_traj = scaler.transform(lorenz_traj)\n",
        "        T_data = len(lorenz_traj)\n",
        "\n",
        "        for train_frac in train_fracs:\n",
        "            train_end = int(train_frac * (T_data - 1))\n",
        "            train_input = lorenz_traj[:train_end]\n",
        "            train_target = lorenz_traj[1:train_end + 1]\n",
        "            test_input = lorenz_traj[train_end:-1]\n",
        "            test_target = lorenz_traj[train_end + 1:]\n",
        "            n_test_steps = len(test_input)\n",
        "            initial_in = test_input[0]\n",
        "\n",
        "            for seed in seeds:\n",
        "                trigr = GliaNeuronTripartiteReservoirESN(\n",
        "                    # sizes\n",
        "                    reservoir_size=300,          # N\n",
        "                    input_dim=3,\n",
        "                    astro_nx=20,                 # grid width\n",
        "                    astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "                    rel_channels=128,            # P\n",
        "\n",
        "                    # kinetics / rates\n",
        "                    leak_x=0.45,                 # λ\n",
        "                    rate_c=0.05,                 # α\n",
        "                    rate_g=0.05,                 # ρ\n",
        "                    diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "                    # neuron bias\n",
        "                    bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "                    # nonlinearities (F, Γ)\n",
        "                    c_max=1.0,                   # max Ca\n",
        "                    k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "                    theta_c=0.0,                 # midpoint for F\n",
        "                    k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "                    theta_g=0.0,                 # midpoint for Γ\n",
        "                    zeta=0.0,                    # tonic drive (scalar)\n",
        "                    g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "                    delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "                    # input map\n",
        "                    input_scale=0.2,\n",
        "\n",
        "                    # randomization / sparsity\n",
        "                    W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "                    footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "                    block_scale=1.0,             # base std for random blocks\n",
        "                    eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "                    # spectral safety targets (row budgets, both < 1)\n",
        "                    rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "                    rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "                    # read-out\n",
        "                    ridge_alpha=1e-6,\n",
        "                    use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "                    feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "                )\n",
        "                trigr.fit_readout(train_input, train_target, discard=100)\n",
        "                trigr_preds = trigr.predict_autoregressive(initial_input, num_steps)\n",
        "                trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "                nrmse_dict[rho_star].append(trigr_nrmse)\n",
        "                trigr_VPT, trigr_VPT_ratio = compute_valid_prediction_time(test_target, trigr_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "                VPT_dict[rho_star].append(trigr_VPT)\n",
        "                VPT_ratio_dict[rho_star].append(trigr_VPT_ratio)\n",
        "                trigr_adev = compute_attractor_deviation(trigr_preds, test_target)\n",
        "                adev_dict[rho_star].append(trigr_adev)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "a0d28617",
      "metadata": {
        "id": "a0d28617"
      },
      "outputs": [],
      "source": [
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'0.7':<17} {'0.9':<17} {'0.92':<17} {'0.99':<17} {'1.05':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    vals1 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict[0.7]]\n",
        "    vals2 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict[0.9]]\n",
        "    vals3 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict[0.92]]\n",
        "    vals4 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict[0.99]]\n",
        "    vals5 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict[1.05]]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [vals1, vals2, vals3, vals4, vals5]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()\n",
        "\n",
        "print()\n",
        "\n",
        "print(f\"{'':<20} {'0.7':<20} {'0.9':<20} {'0.92':<20} {'0.99':<20} {'1.05':<20}\")\n",
        "print(\"-\" * 160)\n",
        "\n",
        "print(f\"{'T_VPT':<20}\", end='')\n",
        "for rho_star in [0.7, 0.9, 0.92, 0.99, 1.05]:\n",
        "    mean = np.mean(VPT_dict[rho_star])\n",
        "    std = np.std(VPT_dict[rho_star])\n",
        "    print(f\"{mean:.3f} ± {std:.2f}\".ljust(20), end='')\n",
        "print()\n",
        "\n",
        "print(f\"{'T_VPT/T_lambda':<20}\", end='')\n",
        "for rho_star in [0.7, 0.9, 0.92, 0.99, 1.05]:\n",
        "    mean = np.mean(VPT_ratio_dict[rho_star])\n",
        "    std = np.std(VPT_ratio_dict[rho_star])\n",
        "    print(f\"{mean:.3f} ± {std:.2f}\".ljust(20), end='')\n",
        "print()\n",
        "print()\n",
        "\n",
        "print(f\"{'':<20} {'0.7':<20} {'0.9':<20} {'0.92':<20} {'0.99':<20} {'1.05':<20}\")\n",
        "print(\"-\" * 160)\n",
        "\n",
        "print(f\"{'ADev':<20}\", end='')\n",
        "for rho_star in [0.7, 0.9, 0.92, 0.99, 1.05]:\n",
        "    values = adev_dict[rho_star]\n",
        "    mean = np.mean(values)\n",
        "    mad = np.mean(np.abs(values - mean))\n",
        "    print(f\"{mean:.2f} ± {mad:.2f}\".ljust(20), end='')\n",
        "print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "83fdbe33",
      "metadata": {
        "id": "83fdbe33"
      },
      "source": [
        "## Ablation over input scale\n"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "feb940cd",
      "metadata": {
        "id": "feb940cd"
      },
      "outputs": [],
      "source": [
        "for input_scale in [0.3,0.5,0.7,0.9,1.0]:\n",
        "    nrmse_dict[input_scale] = []\n",
        "    VPT_dict[input_scale] = []\n",
        "    VPT_ratio_dict[input_scale] = []\n",
        "    adev_dict[input_scale] = []\n",
        "    for initial_state in initial_states:\n",
        "        t_vals, lorenz_traj = generate_lorenz_data(\n",
        "        initial_state=initial_state,\n",
        "        tmax=tmax,\n",
        "        dt=dt\n",
        "        )\n",
        "\n",
        "        washout = 2000\n",
        "        t_vals = t_vals[washout:]\n",
        "        lorenz_traj = lorenz_traj[washout:]\n",
        "\n",
        "        scaler = MinMaxScaler()\n",
        "        scaler.fit(lorenz_traj)\n",
        "        lorenz_traj = scaler.transform(lorenz_traj)\n",
        "        T_data = len(lorenz_traj)\n",
        "\n",
        "        for train_frac in train_fracs:\n",
        "            train_end = int(train_frac * (T_data - 1))\n",
        "            train_input = lorenz_traj[:train_end]\n",
        "            train_target = lorenz_traj[1:train_end + 1]\n",
        "            test_input = lorenz_traj[train_end:-1]\n",
        "            test_target = lorenz_traj[train_end + 1:]\n",
        "            n_test_steps = len(test_input)\n",
        "            initial_in = test_input[0]\n",
        "\n",
        "            for seed in seeds:\n",
        "                trigr = GliaNeuronTripartiteReservoirESN(\n",
        "                    # sizes\n",
        "                    reservoir_size=300,          # N\n",
        "                    input_dim=3,\n",
        "                    astro_nx=20,                 # grid width\n",
        "                    astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "                    rel_channels=128,            # P\n",
        "\n",
        "                    # kinetics / rates\n",
        "                    leak_x=0.45,                 # λ\n",
        "                    rate_c=0.05,                 # α\n",
        "                    rate_g=0.05,                 # ρ\n",
        "                    diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "                    # neuron bias\n",
        "                    bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "                    # nonlinearities (F, Γ)\n",
        "                    c_max=1.0,                   # max Ca\n",
        "                    k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "                    theta_c=0.0,                 # midpoint for F\n",
        "                    k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "                    theta_g=0.0,                 # midpoint for Γ\n",
        "                    zeta=0.0,                    # tonic drive (scalar)\n",
        "                    g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "                    delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "                    # input map\n",
        "                    input_scale=0.2,\n",
        "\n",
        "                    # randomization / sparsity\n",
        "                    W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "                    footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "                    block_scale=1.0,             # base std for random blocks\n",
        "                    eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "                    # spectral safety targets (row budgets, both < 1)\n",
        "                    rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "                    rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "                    # read-out\n",
        "                    ridge_alpha=1e-6,\n",
        "                    use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "                    feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "                )\n",
        "                trigr.fit_readout(train_input, train_target, discard=100)\n",
        "                trigr_preds = trigr.predict_autoregressive(initial_input, num_steps)\n",
        "                trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "                nrmse_dict[input_scale].append(trigr_nrmse)\n",
        "                trigr_VPT, trigr_VPT_ratio = compute_valid_prediction_time(test_target, trigr_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "                VPT_dict[input_scale].append(trigr_VPT)\n",
        "                VPT_ratio_dict[input_scale].append(trigr_VPT_ratio)\n",
        "                trigr_adev = compute_attractor_deviation(trigr_preds, test_target)\n",
        "                adev_dict[input_scale].append(trigr_adev)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "dda5d236",
      "metadata": {
        "id": "dda5d236"
      },
      "outputs": [],
      "source": [
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'0.3':<17} {'0.5':<17} {'0.7':<17} {'0.9':<17} {'1.0':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    vals1 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict[0.3]]\n",
        "    vals2 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict[0.5]]\n",
        "    vals3 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict[0.7]]\n",
        "    vals4 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict[0.9]]\n",
        "    vals5 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict[1.0]]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [vals1, vals2, vals3, vals4, vals5]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()\n",
        "\n",
        "print()\n",
        "\n",
        "print(f\"{'':<20} {'0.3':<20} {'0.5':<20} {'0.7':<20} {'0.9':<20} {'1.0':<20}\")\n",
        "print(\"-\" * 160)\n",
        "\n",
        "print(f\"{'T_VPT':<20}\", end='')\n",
        "for input_scale in [0.3, 0.5, 0.7, 0.9, 1.0]:\n",
        "    mean = np.mean(VPT_dict[input_scale])\n",
        "    std = np.std(VPT_dict[input_scale])\n",
        "    print(f\"{mean:.3f} ± {std:.2f}\".ljust(20), end='')\n",
        "print()\n",
        "\n",
        "print(f\"{'T_VPT/T_lambda':<20}\", end='')\n",
        "for input_scale in [0.3, 0.5, 0.7, 0.9, 1.0]:\n",
        "    mean = np.mean(VPT_ratio_dict[input_scale])\n",
        "    std = np.std(VPT_ratio_dict[input_scale])\n",
        "    print(f\"{mean:.3f} ± {std:.2f}\".ljust(20), end='')\n",
        "print()\n",
        "print()\n",
        "\n",
        "print(f\"{'':<20} {'0.3':<20} {'0.5':<20} {'0.7':<20} {'0.9':<20} {'1.0':<20}\")\n",
        "print(\"-\" * 160)\n",
        "\n",
        "print(f\"{'ADev':<20}\", end='')\n",
        "for input_scale in [0.3, 0.5, 0.7, 0.9, 1.0]:\n",
        "    values = adev_dict[input_scale]\n",
        "    mean = np.mean(values)\n",
        "    mad = np.mean(np.abs(values - mean))\n",
        "    print(f\"{mean:.2f} ± {mad:.2f}\".ljust(20), end='')\n",
        "print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "dde2323b",
      "metadata": {
        "id": "dde2323b"
      },
      "source": [
        "## Ablation over leaking rate\n"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "74a793e2",
      "metadata": {
        "id": "74a793e2"
      },
      "outputs": [],
      "source": [
        "for alpha in [0.5,0.7,0.8,0.9,1.0]:\n",
        "    nrmse_dict[alpha] = []\n",
        "    VPT_dict[alpha] = []\n",
        "    VPT_ratio_dict[alpha] = []\n",
        "    adev_dict[alpha] = []\n",
        "    for initial_state in initial_states:\n",
        "        t_vals, lorenz_traj = generate_lorenz_data(\n",
        "        initial_state=initial_state,\n",
        "        tmax=tmax,\n",
        "        dt=dt\n",
        "        )\n",
        "\n",
        "        washout = 2000\n",
        "        t_vals = t_vals[washout:]\n",
        "        lorenz_traj = lorenz_traj[washout:]\n",
        "\n",
        "        scaler = MinMaxScaler()\n",
        "        scaler.fit(lorenz_traj)\n",
        "        lorenz_traj = scaler.transform(lorenz_traj)\n",
        "        T_data = len(lorenz_traj)\n",
        "\n",
        "        for train_frac in train_fracs:\n",
        "            train_end = int(train_frac * (T_data - 1))\n",
        "            train_input = lorenz_traj[:train_end]\n",
        "            train_target = lorenz_traj[1:train_end + 1]\n",
        "            test_input = lorenz_traj[train_end:-1]\n",
        "            test_target = lorenz_traj[train_end + 1:]\n",
        "            n_test_steps = len(test_input)\n",
        "            initial_in = test_input[0]\n",
        "\n",
        "            for seed in seeds:\n",
        "                trigr = GliaNeuronTripartiteReservoirESN(\n",
        "                    # sizes\n",
        "                    reservoir_size=300,          # N\n",
        "                    input_dim=3,\n",
        "                    astro_nx=20,                 # grid width\n",
        "                    astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "                    rel_channels=128,            # P\n",
        "\n",
        "                    # kinetics / rates\n",
        "                    leak_x=0.45,                 # λ\n",
        "                    rate_c=0.05,                 # α\n",
        "                    rate_g=0.05,                 # ρ\n",
        "                    diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "                    # neuron bias\n",
        "                    bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "                    # nonlinearities (F, Γ)\n",
        "                    c_max=1.0,                   # max Ca\n",
        "                    k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "                    theta_c=0.0,                 # midpoint for F\n",
        "                    k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "                    theta_g=0.0,                 # midpoint for Γ\n",
        "                    zeta=0.0,                    # tonic drive (scalar)\n",
        "                    g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "                    delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "                    # input map\n",
        "                    input_scale=0.2,\n",
        "\n",
        "                    # randomization / sparsity\n",
        "                    W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "                    footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "                    block_scale=1.0,             # base std for random blocks\n",
        "                    eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "                    # spectral safety targets (row budgets, both < 1)\n",
        "                    rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "                    rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "                    # read-out\n",
        "                    ridge_alpha=1e-6,\n",
        "                    use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "                    feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "                )\n",
        "                trigr.fit_readout(train_input, train_target, discard=100)\n",
        "                trigr_preds = trigr.predict_autoregressive(initial_input, num_steps)\n",
        "                trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "                nrmse_dict[alpha].append(trigr_nrmse)\n",
        "                trigr_VPT, trigr_VPT_ratio = compute_valid_prediction_time(test_target, trigr_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "                VPT_dict[alpha].append(trigr_VPT)\n",
        "                VPT_ratio_dict[alpha].append(trigr_VPT_ratio)\n",
        "                trigr_adev = compute_attractor_deviation(trigr_preds, test_target)\n",
        "                adev_dict[alpha].append(trigr_adev)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "92d80419",
      "metadata": {
        "id": "92d80419"
      },
      "outputs": [],
      "source": [
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'0.5':<17} {'0.7':<17} {'0.8':<17} {'0.9':<17} {'1.0':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    vals1 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict[0.5]]\n",
        "    vals2 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict[0.7]]\n",
        "    vals3 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict[0.8]]\n",
        "    vals4 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict[0.9]]\n",
        "    vals5 = [np.mean(nrmse[horizon]) for nrmse in nrmse_dict[1.0]]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [vals1, vals2, vals3, vals4, vals5]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()\n",
        "\n",
        "print()\n",
        "\n",
        "print(f\"{'':<20} {'0.5':<20} {'0.7':<20} {'0.8':<20} {'0.9':<20} {'1.0':<20}\")\n",
        "print(\"-\" * 160)\n",
        "\n",
        "print(f\"{'T_VPT':<20}\", end='')\n",
        "for alpha in [0.5, 0.7, 0.8, 0.9, 1.0]:\n",
        "    mean = np.mean(VPT_dict[alpha])\n",
        "    std = np.std(VPT_dict[alpha])\n",
        "    print(f\"{mean:.3f} ± {std:.2f}\".ljust(20), end='')\n",
        "print()\n",
        "\n",
        "print(f\"{'T_VPT/T_lambda':<20}\", end='')\n",
        "for alpha in [0.5, 0.7, 0.8, 0.9, 1.0]:\n",
        "    mean = np.mean(VPT_ratio_dict[alpha])\n",
        "    std = np.std(VPT_ratio_dict[alpha])\n",
        "    print(f\"{mean:.3f} ± {std:.2f}\".ljust(20), end='')\n",
        "print()\n",
        "print()\n",
        "\n",
        "print(f\"{'':<20} {'0.5':<20} {'0.7':<20} {'0.8':<20} {'0.9':<20} {'1.0':<20}\")\n",
        "print(\"-\" * 160)\n",
        "\n",
        "print(f\"{'ADev':<20}\", end='')\n",
        "for alpha in [0.5, 0.7, 0.8, 0.9, 1.0]:\n",
        "    values = adev_dict[alpha]\n",
        "    mean = np.mean(values)\n",
        "    mad = np.mean(np.abs(values - mean))\n",
        "    print(f\"{mean:.2f} ± {mad:.2f}\".ljust(20), end='')\n",
        "print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "d8719c3c",
      "metadata": {
        "id": "d8719c3c"
      },
      "source": [
        "# MIT-BIH Dataset"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "54b46a85",
      "metadata": {
        "id": "54b46a85"
      },
      "outputs": [],
      "source": [
        "import wfdb\n",
        "\n",
        "# Download and load record and annotations for patient #100\n",
        "record = wfdb.rdrecord('100', sampfrom=0, sampto=25002, pn_dir='mitdb')  # first 20,000 samples\n",
        "annotation = wfdb.rdann('100', 'atr', sampfrom=0, sampto=25002, pn_dir='mitdb')"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "7a0e8cf6",
      "metadata": {
        "id": "7a0e8cf6"
      },
      "outputs": [],
      "source": [
        "# Get input signal u(t) from the first channel\n",
        "u = record.p_signal[:, 0]\n",
        "u"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "93538ea2",
      "metadata": {
        "id": "93538ea2"
      },
      "outputs": [],
      "source": [
        "# Normalize input\n",
        "u_min = np.min(u)\n",
        "u_max = np.max(u)\n",
        "u_norm = (u - u_min) / (u_max - u_min)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "6dfcd0fb",
      "metadata": {
        "id": "6dfcd0fb"
      },
      "outputs": [],
      "source": [
        "fs = record.fs  # sampling frequency (should be 360 Hz)\n",
        "t_vals = np.arange(len(u_norm)) / fs"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "ef734865",
      "metadata": {
        "id": "ef734865"
      },
      "outputs": [],
      "source": [
        "emb_dim = 3\n",
        "# inputs = u_norm\n",
        "inputs = create_delay_embedding(u_norm, emb_dim)\n",
        "\n",
        "# Create target array (heartbeat locations)\n",
        "targets = np.zeros(len(u_norm))\n",
        "targets[annotation.sample] = 1  # mark annotations as 1 (heartbeat)\n",
        "targets = create_delay_embedding(targets, emb_dim)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "938389fc",
      "metadata": {
        "id": "938389fc"
      },
      "outputs": [],
      "source": [
        "data_size = len(inputs)\n",
        "train_size = 15000\n",
        "train_input = inputs[:train_size]\n",
        "train_target = targets[:train_size]\n",
        "test_input = inputs[train_size+1:]\n",
        "test_target = targets[train_size+1:]\n",
        "test_size = len(test_input)\n",
        "print(f\"Total samples: {data_size}, train size: {train_size}, test size: {test_size}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "f2f85de1",
      "metadata": {
        "id": "f2f85de1"
      },
      "outputs": [],
      "source": [
        "all_horizons = [300, 600, 1000]\n",
        "\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "seeds = range(995, 1025)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    esn = ESN3D(\n",
        "        reservoir_size=300,\n",
        "        spectral_radius=0.99,\n",
        "        connectivity=0.05,\n",
        "        input_scale=0.2,\n",
        "        leaking_rate=0.8,\n",
        "        ridge_alpha=1e-6,\n",
        "        seed=seed\n",
        "    )\n",
        "    esn.fit_readout(train_input, train_target, discard=5000)\n",
        "    esn_preds = esn.predict_open_loop(test_input)\n",
        "    esn_nrmse = evaluate_nrmse(esn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['ESN'].append(esn_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    cycle_res = CR3D(\n",
        "        reservoir_size=300,\n",
        "        cycle_weight = 0.8,\n",
        "        spectral_radius=0.99,\n",
        "        input_scale=0.2,\n",
        "        leaking_rate=0.8,\n",
        "        ridge_alpha=1e-6,\n",
        "        seed=seed\n",
        "    )\n",
        "    cycle_res.fit_readout(train_input, train_target, discard=5000)\n",
        "    cycle_res_preds = cycle_res.predict_open_loop(test_input)\n",
        "    cycle_res_nrmse = evaluate_nrmse(cycle_res_preds, test_target, all_horizons)\n",
        "    nrmse_dict['SCR'].append(cycle_res_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    crj = CRJ3D(\n",
        "        reservoir_size=300,\n",
        "        edge_weight=0.8,\n",
        "        jump=15,\n",
        "        spectral_radius=0.99,\n",
        "        input_scale=0.2,\n",
        "        leaking_rate=0.8,\n",
        "        ridge_alpha=1e-6,\n",
        "        seed=seed\n",
        "    )\n",
        "    crj.fit_readout(train_input, train_target, discard=5000)\n",
        "    crj_preds = crj.predict_open_loop(test_input)\n",
        "    crj_nrmse = evaluate_nrmse(crj_preds, test_target, all_horizons)\n",
        "    nrmse_dict['CRJ'].append(crj_nrmse)\n",
        "\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    mci_esn = MCI3D(\n",
        "        reservoir_size=300,\n",
        "        cycle_weight=0.9,\n",
        "        connect_weight=0.9,\n",
        "        input_scale=1.0,\n",
        "        leaking_rate=0.5,\n",
        "        ridge_alpha=1e-6,\n",
        "        combine_factor=0.5,\n",
        "        v1=0.5, v2=0.5,\n",
        "        seed=seed\n",
        "    )\n",
        "    mci_esn.fit_readout(train_input, train_target, discard=5000)\n",
        "    mci_esn_preds = mci_esn.predict_open_loop(test_input)\n",
        "    mci_esn_nrmse = evaluate_nrmse(mci_esn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['MCI-ESN'].append(mci_esn_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    deepesn = DeepESN3D(\n",
        "        num_layers=3,\n",
        "        reservoir_size=100,\n",
        "        spectral_radius=0.99,\n",
        "        input_scale=0.2,\n",
        "        leaking_rate=0.8,\n",
        "        ridge_alpha=1e-6,\n",
        "        seed=seed\n",
        "    )\n",
        "    deepesn.fit_readout(train_input, train_target, discard=5000)\n",
        "    deepesn_preds = deepesn.predict_open_loop(test_input)\n",
        "    deepesn_nrmse = evaluate_nrmse(deepesn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['DeepESN'].append(deepesn_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    trigr = GliaNeuronTripartiteReservoirESN(\n",
        "        # sizes\n",
        "        reservoir_size=300,          # N\n",
        "        input_dim=3,\n",
        "        astro_nx=20,                 # grid width\n",
        "        astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "        rel_channels=128,            # P\n",
        "\n",
        "        # kinetics / rates\n",
        "        leak_x=0.45,                 # λ\n",
        "        rate_c=0.05,                 # α\n",
        "        rate_g=0.05,                 # ρ\n",
        "        diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "        # neuron bias\n",
        "        bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "        # nonlinearities (F, Γ)\n",
        "        c_max=1.0,                   # max Ca\n",
        "        k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "        theta_c=0.0,                 # midpoint for F\n",
        "        k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "        theta_g=0.0,                 # midpoint for Γ\n",
        "        zeta=0.0,                    # tonic drive (scalar)\n",
        "        g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "        delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "        # input map\n",
        "        input_scale=0.2,\n",
        "\n",
        "        # randomization / sparsity\n",
        "        W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "        footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "        block_scale=1.0,             # base std for random blocks\n",
        "        eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "        # spectral safety targets (row budgets, both < 1)\n",
        "        rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "        rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "        # read-out\n",
        "        ridge_alpha=1e-6,\n",
        "        use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "        feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "    )\n",
        "    trigr.fit_readout(train_input, train_target, discard=5000)\n",
        "    trigr_preds = trigr.predict_open_loop(test_input)\n",
        "    trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "    nrmse_dict['TRIGR'].append(trigr_nrmse)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "337c012a",
      "metadata": {
        "id": "337c012a"
      },
      "outputs": [],
      "source": [
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'ESN':<17} {'SCR':<17} {'CRJ':<17} {'MCI-ESN':<17} {'DeepESN':<17} {'TRIGR':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in all_horizons:\n",
        "    esn_vals = [np.mean(esn_nrmse[horizon]) for esn_nrmse in nrmse_dict['ESN']]\n",
        "    scr_vals = [np.mean(cycle_res_nrmse[horizon]) for cycle_res_nrmse in nrmse_dict['SCR']]\n",
        "    crj_vals = [np.mean(crj_nrmse[horizon]) for crj_nrmse in nrmse_dict['CRJ']]\n",
        "    mci_vals = [np.mean(mci_esn_nrmse[horizon]) for mci_esn_nrmse in nrmse_dict['MCI-ESN']]\n",
        "    deep_vals = [np.mean(deepesn_nrmse[horizon]) for deepesn_nrmse in nrmse_dict['DeepESN']]\n",
        "    trigr_vals = [np.mean(trigr_nrmse[horizon]) for trigr_nrmse in nrmse_dict['TRIGR']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [esn_vals, scr_vals, crj_vals, mci_vals, deep_vals, trigr_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "a39c1e20",
      "metadata": {
        "id": "a39c1e20"
      },
      "source": [
        "# Sunspot Dataset"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "3232502c",
      "metadata": {
        "id": "3232502c"
      },
      "outputs": [],
      "source": [
        "import pandas as pd\n",
        "file_path = 'dataset/SN_m_tot_V2.0.csv'\n",
        "\n",
        "df = pd.read_csv(file_path, sep=';', header = None)\n",
        "df"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "98f8602b",
      "metadata": {
        "id": "98f8602b"
      },
      "outputs": [],
      "source": [
        "data = df.iloc[:, 3].values\n",
        "dt = 1\n",
        "dataset_size = len(data)\n",
        "data = create_delay_embedding(data, 3)\n",
        "print(f\"Dataset size: {dataset_size}\")\n",
        "\n",
        "# Train/Test Split\n",
        "train_end = 2000\n",
        "train_input  = data[:train_end]\n",
        "train_target = data[1:train_end+1]\n",
        "test_input   = data[train_end:-1]\n",
        "test_target  = data[train_end+1:]\n",
        "y_test = test_target\n",
        "n_test_steps = len(test_target)\n",
        "time_test = np.arange(n_test_steps) * dt\n",
        "\n",
        "print(f\"Train size: {len(train_input)}\\nTest size: {len(test_input)}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "c7684b3f",
      "metadata": {
        "id": "c7684b3f"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [300, 600, 1000]\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "seeds = range(995, 1025)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    esn = ESN3D(\n",
        "        reservoir_size=300,\n",
        "        spectral_radius=0.95,\n",
        "        connectivity=0.05,\n",
        "        input_scale=0.1,\n",
        "        leaking_rate=0.8,\n",
        "        ridge_alpha=1e-4,\n",
        "        seed=seed\n",
        "    )\n",
        "    esn.fit_readout(train_input, train_target, discard=100)\n",
        "    esn_preds = esn.predict_open_loop(test_input)\n",
        "    esn_nrmse = evaluate_nrmse(esn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['ESN'].append(esn_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    cycle_res = CR3D(\n",
        "        reservoir_size=300,\n",
        "        cycle_weight = 0.8,\n",
        "        spectral_radius=0.95,\n",
        "        input_scale=0.4,\n",
        "        leaking_rate=0.8,\n",
        "        ridge_alpha=1e-4,\n",
        "        seed=seed\n",
        "    )\n",
        "    cycle_res.fit_readout(train_input, train_target, discard=100)\n",
        "    cycle_res_preds = cycle_res.predict_open_loop(test_input)\n",
        "    cycle_res_nrmse = evaluate_nrmse(cycle_res_preds, test_target, all_horizons)\n",
        "    nrmse_dict['SCR'].append(cycle_res_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    crj = CRJ3D(\n",
        "        reservoir_size=300,\n",
        "        edge_weight=0.8,\n",
        "        jump=5,\n",
        "        spectral_radius=0.95,\n",
        "        input_scale=0.4,\n",
        "        leaking_rate=0.8,\n",
        "        ridge_alpha=1e-4,\n",
        "        seed=seed\n",
        "    )\n",
        "    crj.fit_readout(train_input, train_target, discard=100)\n",
        "    crj_preds = crj.predict_open_loop(test_input)\n",
        "    crj_nrmse = evaluate_nrmse(crj_preds, test_target, all_horizons)\n",
        "    nrmse_dict['CRJ'].append(crj_nrmse)\n",
        "\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    mci_esn = MCI3D(\n",
        "        reservoir_size=300,\n",
        "        cycle_weight=0.9,\n",
        "        connect_weight=0.9,\n",
        "        input_scale=1.0,\n",
        "        leaking_rate=0.5,\n",
        "        ridge_alpha=1e-6,\n",
        "        combine_factor=0.5,\n",
        "        v1=0.5, v2=0.5,\n",
        "        seed=seed\n",
        "    )\n",
        "    mci_esn.fit_readout(train_input, train_target, discard=5000)\n",
        "    mci_esn_preds = mci_esn.predict_open_loop(test_input)\n",
        "    mci_esn_nrmse = evaluate_nrmse(mci_esn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['MCI-ESN'].append(mci_esn_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    deepesn = DeepESN3D(\n",
        "        num_layers=3,\n",
        "        reservoir_size=100,\n",
        "        spectral_radius=0.95,\n",
        "        input_scale=0.1,\n",
        "        leaking_rate=0.6,\n",
        "        ridge_alpha=1e-4,\n",
        "        seed=seed\n",
        "    )\n",
        "    deepesn.fit_readout(train_input, train_target, discard=100)\n",
        "    deepesn_preds = deepesn.predict_open_loop(test_input)\n",
        "    deepesn_nrmse = evaluate_nrmse(deepesn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['DeepESN'].append(deepesn_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    trigr = GliaNeuronTripartiteReservoirESN(\n",
        "        # sizes\n",
        "        reservoir_size=300,          # N\n",
        "        input_dim=3,\n",
        "        astro_nx=20,                 # grid width\n",
        "        astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "        rel_channels=128,            # P\n",
        "\n",
        "        # kinetics / rates\n",
        "        leak_x=0.45,                 # λ\n",
        "        rate_c=0.05,                 # α\n",
        "        rate_g=0.05,                 # ρ\n",
        "        diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "        # neuron bias\n",
        "        bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "        # nonlinearities (F, Γ)\n",
        "        c_max=1.0,                   # max Ca\n",
        "        k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "        theta_c=0.0,                 # midpoint for F\n",
        "        k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "        theta_g=0.0,                 # midpoint for Γ\n",
        "        zeta=0.0,                    # tonic drive (scalar)\n",
        "        g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "        delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "        # input map\n",
        "        input_scale=0.2,\n",
        "\n",
        "        # randomization / sparsity\n",
        "        W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "        footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "        block_scale=1.0,             # base std for random blocks\n",
        "        eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "        # spectral safety targets (row budgets, both < 1)\n",
        "        rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "        rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "        # read-out\n",
        "        ridge_alpha=1e-6,\n",
        "        use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "        feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "    )\n",
        "    trigr.fit_readout(train_input, train_target, discard=100)\n",
        "    trigr_preds = trigr.predict_open_loop(test_input)\n",
        "    trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "    nrmse_dict['TRIGR'].append(trigr_nrmse)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "daaef00f",
      "metadata": {
        "id": "daaef00f"
      },
      "outputs": [],
      "source": [
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'ESN':<17} {'SCR':<17} {'CRJ':<17} {'MCI-ESN':<17} {'DeepESN':<17} {'TRIGR':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    esn_vals = [np.mean(esn_nrmse[horizon]) for esn_nrmse in nrmse_dict['ESN']]\n",
        "    scr_vals = [np.mean(cycle_res_nrmse[horizon]) for cycle_res_nrmse in nrmse_dict['SCR']]\n",
        "    crj_vals = [np.mean(crj_nrmse[horizon]) for crj_nrmse in nrmse_dict['CRJ']]\n",
        "    mci_vals = [np.mean(mci_esn_nrmse[horizon]) for mci_esn_nrmse in nrmse_dict['MCI-ESN']]\n",
        "    deep_vals = [np.mean(deepesn_nrmse[horizon]) for deepesn_nrmse in nrmse_dict['DeepESN']]\n",
        "    trigr_vals = [np.mean(trigr_nrmse[horizon]) for trigr_nrmse in nrmse_dict['TRIGR']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [esn_vals, scr_vals, crj_vals, mci_vals, deep_vals, trigr_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "49e6ee32",
      "metadata": {
        "id": "49e6ee32"
      },
      "source": [
        "# Sante Fe Dataset"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "2407cfd9",
      "metadata": {
        "id": "2407cfd9"
      },
      "outputs": [],
      "source": [
        "import pandas as pd\n",
        "\n",
        "file_path = 'dataset/santa-fe-time-series/b1.txt'\n",
        "\n",
        "df = pd.read_csv(file_path, header=None, sep=' ')\n",
        "df"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "b5624624",
      "metadata": {
        "id": "b5624624"
      },
      "outputs": [],
      "source": [
        "# Normalize the first column (column 0) of the DataFrame\n",
        "df[0] = (df[0] - df[0].min()) / (df[0].max() - df[0].min())"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "ae5bf803",
      "metadata": {
        "id": "ae5bf803"
      },
      "outputs": [],
      "source": [
        "data = df.iloc[:, 0].values\n",
        "chosen_system = \"SantaFe\"\n",
        "dt = 1\n",
        "T_data = len(data)\n",
        "data = create_delay_embedding(data, 3)\n",
        "print(f\"Data length: {T_data}.\")\n",
        "\n",
        "# Train/Test Split\n",
        "train_end = 7000\n",
        "train_input  = data[:train_end]\n",
        "train_target = data[1:train_end+1]\n",
        "test_input   = data[train_end:-1]\n",
        "test_target  = data[train_end+1:]\n",
        "y_test = test_target\n",
        "n_test_steps = len(test_target)\n",
        "time_test = np.arange(n_test_steps) * dt\n",
        "\n",
        "print(f\"Train size: {len(train_input)}  \\nTest size: {len(test_input)}\")\n"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "5900d956",
      "metadata": {
        "id": "5900d956"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [200, 500, 1000]\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "seeds = range(995, 1025)\n",
        "\n",
        "for seed in seeds:\n",
        "    esn = ESN3D(\n",
        "        reservoir_size=300,\n",
        "        spectral_radius=0.95,\n",
        "        connectivity=0.05,\n",
        "        input_scale=0.1,\n",
        "        leaking_rate=0.8,\n",
        "        ridge_alpha=1e-4,\n",
        "        seed=seed\n",
        "    )\n",
        "    esn.fit_readout(train_input, train_target, discard=100)\n",
        "    esn_preds = esn.predict_open_loop(test_input)\n",
        "    esn_nrmse = evaluate_nrmse(esn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['ESN'].append(esn_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    cycle_res = CR3D(\n",
        "        reservoir_size=300,\n",
        "        cycle_weight = 0.8,\n",
        "        spectral_radius=0.99,\n",
        "        input_scale=0.4,\n",
        "        leaking_rate=0.8,\n",
        "        ridge_alpha=1e-4,\n",
        "        seed=seed\n",
        "    )\n",
        "    cycle_res.fit_readout(train_input, train_target, discard=100)\n",
        "    cycle_res_preds = cycle_res.predict_open_loop(test_input)\n",
        "    cycle_res_nrmse = evaluate_nrmse(cycle_res_preds, test_target, all_horizons)\n",
        "    nrmse_dict['SCR'].append(cycle_res_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    crj = CRJ3D(\n",
        "        reservoir_size=300,\n",
        "        edge_weight=0.8,\n",
        "        jump=5,\n",
        "        spectral_radius=0.95,\n",
        "        input_scale=0.4,\n",
        "        leaking_rate=0.8,\n",
        "        ridge_alpha=1e-4,\n",
        "        seed=seed\n",
        "    )\n",
        "    crj.fit_readout(train_input, train_target, discard=100)\n",
        "    crj_preds = crj.predict_open_loop(test_input)\n",
        "    crj_nrmse = evaluate_nrmse(crj_preds, test_target, all_horizons)\n",
        "    nrmse_dict['CRJ'].append(crj_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    mci_esn = MCI3D(\n",
        "        reservoir_size=300,\n",
        "        cycle_weight=0.9,\n",
        "        connect_weight=0.9,\n",
        "        input_scale=1.0,\n",
        "        leaking_rate=0.5,\n",
        "        ridge_alpha=1e-6,\n",
        "        combine_factor=0.5,\n",
        "        v1=0.5, v2=0.5,\n",
        "        seed=seed\n",
        "    )\n",
        "    mci_esn.fit_readout(train_input, train_target, discard=5000)\n",
        "    mci_esn_preds = mci_esn.predict_open_loop(test_input)\n",
        "    mci_esn_nrmse = evaluate_nrmse(mci_esn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['MCI-ESN'].append(mci_esn_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    deepesn = DeepESN3D(\n",
        "        num_layers=3,\n",
        "        reservoir_size=100,\n",
        "        spectral_radius=0.85,\n",
        "        input_scale=0.2,\n",
        "        leaking_rate=0.9,\n",
        "        ridge_alpha=1e-4,\n",
        "        seed=seed\n",
        "    )\n",
        "    deepesn.fit_readout(train_input, train_target, discard=100)\n",
        "    deepesn_preds = deepesn.predict_open_loop(test_input)\n",
        "    deepesn_nrmse = evaluate_nrmse(deepesn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['DeepESN'].append(deepesn_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    trigr = GliaNeuronTripartiteReservoirESN(\n",
        "        # sizes\n",
        "        reservoir_size=300,          # N\n",
        "        input_dim=3,\n",
        "        astro_nx=20,                 # grid width\n",
        "        astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "        rel_channels=128,            # P\n",
        "\n",
        "        # kinetics / rates\n",
        "        leak_x=0.45,                 # λ\n",
        "        rate_c=0.05,                 # α\n",
        "        rate_g=0.05,                 # ρ\n",
        "        diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "        # neuron bias\n",
        "        bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "        # nonlinearities (F, Γ)\n",
        "        c_max=1.0,                   # max Ca\n",
        "        k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "        theta_c=0.0,                 # midpoint for F\n",
        "        k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "        theta_g=0.0,                 # midpoint for Γ\n",
        "        zeta=0.0,                    # tonic drive (scalar)\n",
        "        g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "        delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "        # input map\n",
        "        input_scale=0.2,\n",
        "\n",
        "        # randomization / sparsity\n",
        "        W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "        footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "        block_scale=1.0,             # base std for random blocks\n",
        "        eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "        # spectral safety targets (row budgets, both < 1)\n",
        "        rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "        rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "        # read-out\n",
        "        ridge_alpha=1e-6,\n",
        "        use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "        feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "    )\n",
        "    trigr.fit_readout(train_input, train_target, discard=100)\n",
        "    trigr_preds = trigr.predict_open_loop(test_input)\n",
        "    trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "    nrmse_dict['TRIGR'].append(trigr_nrmse)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "4a243d60",
      "metadata": {
        "id": "4a243d60"
      },
      "outputs": [],
      "source": [
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'ESN':<17} {'SCR':<17} {'CRJ':<17} {'MCI-ESN':<17} {'DeepESN':<17} {'TRIGR':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    esn_vals = [np.mean(esn_nrmse[horizon]) for esn_nrmse in nrmse_dict['ESN']]\n",
        "    scr_vals = [np.mean(cycle_res_nrmse[horizon]) for cycle_res_nrmse in nrmse_dict['SCR']]\n",
        "    crj_vals = [np.mean(crj_nrmse[horizon]) for crj_nrmse in nrmse_dict['CRJ']]\n",
        "    mci_vals = [np.mean(mci_esn_nrmse[horizon]) for mci_esn_nrmse in nrmse_dict['MCI-ESN']]\n",
        "    deep_vals = [np.mean(deepesn_nrmse[horizon]) for deepesn_nrmse in nrmse_dict['DeepESN']]\n",
        "    trigr_vals = [np.mean(trigr_nrmse[horizon]) for trigr_nrmse in nrmse_dict['TRIGR']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [esn_vals, scr_vals, crj_vals, mci_vals, deep_vals, trigr_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "b8d211eb",
      "metadata": {
        "id": "b8d211eb"
      },
      "source": [
        "# BIDMC"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "7cc69ef0",
      "metadata": {
        "id": "7cc69ef0"
      },
      "outputs": [],
      "source": [
        "# ─── Load BIDMC Record ─────────────────────────────────────────────────────\n",
        "record_id = 'bidmc01'\n",
        "record = wfdb.rdrecord(record_id, pn_dir='bidmc', sampto=8 * 60 * 125)  # 8 mins at 125Hz\n",
        "signals = record.p_signal  # shape: (60000, 5)\n",
        "names = [n.strip().strip(',') for n in record.sig_name]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "b2190e65",
      "metadata": {
        "id": "b2190e65"
      },
      "outputs": [],
      "source": [
        "# ─── Get Indices of ECG Lead II and RESP ──────────────────────────────────\n",
        "idx_ecg = names.index('II')     # ECG Lead II\n",
        "idx_resp = names.index('RESP')  # Respiration signal"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "c08a63f6",
      "metadata": {
        "id": "c08a63f6"
      },
      "outputs": [],
      "source": [
        "# ─── Parameters ────────────────────────────────────────────────────────────\n",
        "N_train = 10000\n",
        "N_test = 5000\n",
        "emb_dim = 3"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "3a6af9b5",
      "metadata": {
        "id": "3a6af9b5"
      },
      "outputs": [],
      "source": [
        "# ─── Select Signals ────────────────────────────────────────────────────────\n",
        "u = signals[:, idx_ecg]   # input: ECG Lead II\n",
        "v = signals[:, idx_resp]  # target: RESP"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "2ff0f51f",
      "metadata": {
        "id": "2ff0f51f"
      },
      "outputs": [],
      "source": [
        "# ─── Normalize to [-1, 1] ──────────────────────────────────────────────────\n",
        "u_norm = 2 * (u - np.min(u)) / (np.max(u) - np.min(u)) - 1\n",
        "v_norm = 2 * (v - np.min(v)) / (np.max(v) - np.min(v)) - 1"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "794a5a6d",
      "metadata": {
        "id": "794a5a6d"
      },
      "outputs": [],
      "source": [
        "# ─── Delay Embedding ───────────────────────────────────────────────────────\n",
        "inputs = create_delay_embedding(u_norm, emb_dim)\n",
        "targets = create_delay_embedding(v_norm, emb_dim)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "c3cd40b9",
      "metadata": {
        "id": "c3cd40b9"
      },
      "outputs": [],
      "source": [
        "# ─── Train/Test Split ──────────────────────────────────────────────────────\n",
        "train_input = inputs[:N_train]\n",
        "train_target = targets[:N_train]\n",
        "test_input = inputs[N_train:N_train+N_test]\n",
        "test_target = targets[N_train:N_train+N_test]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "f363f9a6",
      "metadata": {
        "id": "f363f9a6"
      },
      "outputs": [],
      "source": [
        "# ─── Summary ───────────────────────────────────────────────────────────────\n",
        "print(f\"Train input shape:  {train_input.shape}\")\n",
        "print(f\"Train target shape: {train_target.shape}\")\n",
        "print(f\"Test input shape:   {test_input.shape}\")\n",
        "print(f\"Test target shape:  {test_target.shape}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "349200fb",
      "metadata": {
        "id": "349200fb"
      },
      "outputs": [],
      "source": [
        "horizons = [300, 600, 1000]\n",
        "all_horizons = list(range(10, 1001, 10))\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "seeds = range(995, 1025)\n",
        "\n",
        "for seed in seeds:\n",
        "    esn = ESN3D(\n",
        "        reservoir_size=300,\n",
        "        spectral_radius=0.95,\n",
        "        connectivity=0.2,\n",
        "        input_scale=1.0,\n",
        "        leaking_rate=0.5,\n",
        "        ridge_alpha=1e-6,\n",
        "        seed=seed\n",
        "    )\n",
        "    esn.fit_readout(train_input, train_target, discard=5000)\n",
        "    esn_preds = esn.predict_open_loop(test_input)\n",
        "    esn_nrmse = evaluate_nrmse(esn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['ESN'].append(esn_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    cycle_res = CR3D(\n",
        "        reservoir_size=300,\n",
        "        spectral_radius=0.95,\n",
        "        input_scale=1.0,\n",
        "        leaking_rate=0.5,\n",
        "        ridge_alpha=1e-6,\n",
        "        seed=seed\n",
        "    )\n",
        "    cycle_res.fit_readout(train_input, train_target, discard=5000)\n",
        "    cycle_res_preds = cycle_res.predict_open_loop(test_input)\n",
        "    cycle_res_nrmse = evaluate_nrmse(cycle_res_preds, test_target, all_horizons)\n",
        "    nrmse_dict['SCR'].append(cycle_res_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    crj = CRJ3D(\n",
        "        reservoir_size=300,\n",
        "        jump=10,\n",
        "        spectral_radius=0.95,\n",
        "        input_scale=1.0,\n",
        "        leaking_rate=0.5,\n",
        "        ridge_alpha=1e-6,\n",
        "        seed=seed\n",
        "    )\n",
        "    crj.fit_readout(train_input, train_target, discard=5000)\n",
        "    crj_preds = crj.predict_open_loop(test_input)\n",
        "    crj_nrmse = evaluate_nrmse(crj_preds, test_target, all_horizons)\n",
        "    nrmse_dict['CRJ'].append(crj_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    mci_esn = MCI3D(\n",
        "        reservoir_size=300,\n",
        "        cycle_weight=0.9,\n",
        "        connect_weight=0.9,\n",
        "        input_scale=1.0,\n",
        "        leaking_rate=0.5,\n",
        "        ridge_alpha=1e-6,\n",
        "        combine_factor=0.5,\n",
        "        v1=0.5, v2=0.5,\n",
        "        seed=seed\n",
        "    )\n",
        "    mci_esn.fit_readout(train_input, train_target, discard=5000)\n",
        "    mci_esn_preds = mci_esn.predict_open_loop(test_input)\n",
        "    mci_esn_nrmse = evaluate_nrmse(mci_esn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['MCI-ESN'].append(mci_esn_nrmse)\n",
        "\n",
        "\n",
        "for seed in seeds:\n",
        "    deepesn = DeepESN3D(\n",
        "        num_layers=3,\n",
        "        reservoir_size=100,\n",
        "        spectral_radius=0.95,\n",
        "        connectivity=0.1,\n",
        "        input_scale=1.0,\n",
        "        leaking_rate=0.5,\n",
        "        ridge_alpha=1e-6,\n",
        "        seed=seed\n",
        "    )\n",
        "    deepesn.fit_readout(train_input, train_target, discard=5000)\n",
        "    deepesn_preds = deepesn.predict_open_loop(test_input)\n",
        "    deepesn_nrmse = evaluate_nrmse(deepesn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['DeepESN'].append(deepesn_nrmse)\n",
        "\n",
        "for seed in seeds:\n",
        "    trigr = GliaNeuronTripartiteReservoirESN(\n",
        "        # sizes\n",
        "        reservoir_size=300,          # N\n",
        "        input_dim=3,\n",
        "        astro_nx=20,                 # grid width\n",
        "        astro_ny=20,                 # grid height (M = astro_nx * astro_ny)\n",
        "        rel_channels=128,            # P\n",
        "\n",
        "        # kinetics / rates\n",
        "        leak_x=0.45,                 # λ\n",
        "        rate_c=0.05,                 # α\n",
        "        rate_g=0.05,                 # ρ\n",
        "        diff_D=0.5,                  # D (will be scaled safely)\n",
        "\n",
        "        # neuron bias\n",
        "        bias=0.0,                    # scalar or length-N array\n",
        "\n",
        "        # nonlinearities (F, Γ)\n",
        "        c_max=1.0,                   # max Ca\n",
        "        k_c=1.0,                     # slope for F  (L_F = k_c*c_max/4 ≤ 1 recommended)\n",
        "        theta_c=0.0,                 # midpoint for F\n",
        "        k_g=0.8,                     # slope for Γ  (L_Γ = k_g/4 ≤ 1 recommended)\n",
        "        theta_g=0.0,                 # midpoint for Γ\n",
        "        zeta=0.0,                    # tonic drive (scalar)\n",
        "        g_mode=\"linear\",             # \"linear\" | \"depletion\"\n",
        "        delta_g=0.2,                 # only used if g_mode=\"depletion\"\n",
        "\n",
        "        # input map\n",
        "        input_scale=0.2,\n",
        "\n",
        "        # randomization / sparsity\n",
        "        W_sparsity=0.0,              # fraction of zeros in W_r\n",
        "        footprints_sparsity=0.5,     # initial sparsity in H before row-normalization\n",
        "        block_scale=1.0,             # base std for random blocks\n",
        "        eta_bg=1.0,                  # B_g = eta_bg * H^T (before row scaling)\n",
        "\n",
        "        # spectral safety targets (row budgets, both < 1)\n",
        "        rho_x_target=0.90,           # target for ||W_r|| + ||B_g||\n",
        "        rho_c_target=0.90,           # target for D||L|| + L_F||H W_rel||\n",
        "\n",
        "        # read-out\n",
        "        ridge_alpha=1e-6,\n",
        "        use_poly=True,               # add elementwise squares (except in 'x_x2_g' mode)\n",
        "        feature_mode=\"x_c_g\",        # 'x' | 'x_c_g' | 'x_x2_g'\n",
        "\n",
        "    )\n",
        "    trigr.fit_readout(train_input, train_target, discard=100)\n",
        "    trigr_preds = trigr.predict_open_loop(test_input)\n",
        "    trigr_nrmse = evaluate_nrmse(trigr_preds, test_target, all_horizons)\n",
        "    nrmse_dict['TRIGR'].append(trigr_nrmse)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "36c8ba53",
      "metadata": {
        "id": "36c8ba53"
      },
      "outputs": [],
      "source": [
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'ESN':<17} {'SCR':<17} {'CRJ':<17} {'MCI-ESN':<17} {'DeepESN':<17} {'TRIGR':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    esn_vals = [np.mean(esn_nrmse[horizon]) for esn_nrmse in nrmse_dict['ESN']]\n",
        "    scr_vals = [np.mean(cycle_res_nrmse[horizon]) for cycle_res_nrmse in nrmse_dict['SCR']]\n",
        "    crj_vals = [np.mean(crj_nrmse[horizon]) for crj_nrmse in nrmse_dict['CRJ']]\n",
        "    mci_vals = [np.mean(mci_esn_nrmse[horizon]) for mci_esn_nrmse in nrmse_dict['MCI-ESN']]\n",
        "    deep_vals = [np.mean(deepesn_nrmse[horizon]) for deepesn_nrmse in nrmse_dict['DeepESN']]\n",
        "    trigr_vals = [np.mean(trigr_nrmse[horizon]) for trigr_nrmse in nrmse_dict['TRIGR']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [esn_vals, scr_vals, crj_vals, mci_vals, deep_vals, trigr_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "fa4901ab",
      "metadata": {
        "id": "fa4901ab"
      },
      "source": [
        "# Gradient Based Models"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "c1e2c133",
      "metadata": {
        "id": "c1e2c133"
      },
      "source": [
        "## LSTM"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "196c0a3e",
      "metadata": {
        "id": "196c0a3e"
      },
      "outputs": [],
      "source": [
        "class LSTMBaseline3D:\n",
        "    \"\"\"\n",
        "    Lightweight single-layer LSTM for 3-dim Lorenz forecasting.\n",
        "    * hidden_size=32 \n",
        "    * fit() trains in teacher-forcing mode\n",
        "    * predict() produces autoregressive roll-out\n",
        "    \"\"\"\n",
        "\n",
        "    def __init__(self,\n",
        "                 input_dim:  int = 3,\n",
        "                 hidden_size: int = 37,\n",
        "                 output_dim: int = 3,\n",
        "                 lr: float = 1e-3,\n",
        "                 epochs: int = 30,\n",
        "                 device: str = 'cpu',\n",
        "                 seed: int = 0):\n",
        "        torch.manual_seed(seed); np.random.seed(seed)\n",
        "\n",
        "        self.device  = torch.device(device)\n",
        "        self.epochs  = epochs\n",
        "        self.model   = nn.LSTM(input_dim, hidden_size,\n",
        "                               batch_first=True).to(self.device)\n",
        "        self.head    = nn.Linear(hidden_size, output_dim).to(self.device)\n",
        "        self.crit    = nn.MSELoss()\n",
        "        self.optim   = Adam(list(self.model.parameters())+\n",
        "                            list(self.head.parameters()), lr=lr)\n",
        "\n",
        "    def total_parameters(self):\n",
        "        total = 0\n",
        "        for param in list(self.model.parameters()) + list(self.head.parameters()):\n",
        "            total += param.numel()\n",
        "        return total\n",
        "\n",
        "    # ---------------------------------------------------------\n",
        "    @torch.no_grad()\n",
        "    def _init_hidden(self, batch_sz=1):\n",
        "        h0 = torch.zeros(1, batch_sz,\n",
        "                         self.model.hidden_size,\n",
        "                         device=self.device)\n",
        "        c0 = torch.zeros_like(h0)\n",
        "        return (h0, c0)\n",
        "\n",
        "    # ---------------------------------------------------------\n",
        "    def fit(self, x_np: np.ndarray, y_np: np.ndarray):\n",
        "        \"\"\"\n",
        "        x_np shape [T, 3]  (input  at t)\n",
        "        y_np shape [T, 3]  (target at t)\n",
        "        \"\"\"\n",
        "        x = torch.tensor(x_np, dtype=torch.float32,\n",
        "                         device=self.device).unsqueeze(0)  # [1,T,3]\n",
        "        y = torch.tensor(y_np, dtype=torch.float32,\n",
        "                         device=self.device).unsqueeze(0)\n",
        "\n",
        "        for _ in range(self.epochs):\n",
        "            self.optim.zero_grad()\n",
        "            out, _ = self.model(x, self._init_hidden())\n",
        "            pred   = self.head(out)\n",
        "            loss   = self.crit(pred, y)\n",
        "            loss.backward()\n",
        "            self.optim.step()\n",
        "\n",
        "    # ---------------------------------------------------------\n",
        "    @torch.no_grad()\n",
        "    def predict(self, init_u: np.ndarray, n_steps: int):\n",
        "        \"\"\"\n",
        "        Autoregressive roll-out.\n",
        "        init_u : initial 3-vector (last known sample)\n",
        "        Returns array of shape [n_steps, 3].\n",
        "        \"\"\"\n",
        "        self.model.eval(); self.head.eval()\n",
        "\n",
        "        inp     = torch.tensor(init_u[None, None, :],\n",
        "                               dtype=torch.float32, device=self.device)\n",
        "        h, c    = self._init_hidden()\n",
        "        preds   = np.empty((n_steps, 3), dtype=np.float32)\n",
        "\n",
        "        for t in range(n_steps):\n",
        "            out, (h, c) = self.model(inp, (h, c))\n",
        "            y           = self.head(out)\n",
        "            preds[t]    = y.squeeze(0).cpu().numpy()\n",
        "            inp         = y.detach()    # feed prediction back\n",
        "\n",
        "        return preds\n",
        "\n",
        "    @torch.no_grad()\n",
        "    def predict_open_loop(self, x_np: np.ndarray):\n",
        "        \"\"\"\n",
        "        Open-loop prediction using teacher-forced inputs (like during training).\n",
        "        x_np shape: [T, 3] – input sequence\n",
        "        Returns:\n",
        "            preds: [T, 3] – predicted output sequence\n",
        "        \"\"\"\n",
        "        self.model.eval(); self.head.eval()\n",
        "\n",
        "        x = torch.tensor(x_np, dtype=torch.float32,\n",
        "                         device=self.device).unsqueeze(0)  # [1, T, 3]\n",
        "        out, _ = self.model(x, self._init_hidden())\n",
        "        preds = self.head(out).squeeze(0).cpu().numpy()  # [T, 3]\n",
        "\n",
        "        return preds"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "d318d341",
      "metadata": {
        "id": "d318d341"
      },
      "source": [
        "## NVAR"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "625d9916",
      "metadata": {
        "id": "625d9916"
      },
      "outputs": [],
      "source": [
        "class NVARBaseline3D:\n",
        "    \"\"\"\n",
        "    • delay window length k   (default 5 samples)\n",
        "    • quadratic polynomial lift (all monomials up to degree 2)\n",
        "    • closed-form ridge regression read-out\n",
        "    \"\"\"\n",
        "    def __init__(self,\n",
        "                 k: int = 5,\n",
        "                 ridge_alpha: float = 1e-4):\n",
        "        self.k          = k\n",
        "        self.alpha      = ridge_alpha\n",
        "        self.scaler_mu  = None\n",
        "        self.scaler_sig = None\n",
        "        self.reg        = Ridge(alpha=self.alpha, fit_intercept=False)\n",
        "\n",
        "        # indices for quadratic terms\n",
        "        L  = 3 * k                 # length of flattened delay vector\n",
        "        self.idxs_quad = list(combinations_with_replacement(range(L), 2))\n",
        "\n",
        "    # ---------------------------------------------------------\n",
        "    def _build_feature(self, window: np.ndarray) -> np.ndarray:\n",
        "        \"\"\"\n",
        "        window: shape (k, 3)  -> returns (F,) where\n",
        "          F = 1 + 3k + (3k)(3k+1)/2\n",
        "        \"\"\"\n",
        "        lin = window.flatten()                 # linear terms\n",
        "        quad = np.array([lin[i]*lin[j] for i, j in self.idxs_quad])\n",
        "        return np.concatenate(([1.0], lin, quad), dtype=np.float32)\n",
        "\n",
        "    def total_parameters(self):\n",
        "        total = 0\n",
        "        for param in list(self.model.parameters()) + list(self.head.parameters()):\n",
        "            total += param.numel()\n",
        "        return total\n",
        "\n",
        "    # ---------------------------------------------------------\n",
        "    def fit(self, x_np: np.ndarray, y_np: np.ndarray):\n",
        "        \"\"\"\n",
        "        x_np shape [T, 3] (driver)\n",
        "        y_np shape [T, 3] (target 1-step ahead)\n",
        "        Assumes x_np[t] predicts y_np[t].\n",
        "        \"\"\"\n",
        "        k = self.k\n",
        "        assert len(x_np) == len(y_np)\n",
        "        # normalise inputs\n",
        "        self.scaler_mu  = x_np.mean(0, keepdims=True)\n",
        "        self.scaler_sig = x_np.std (0, keepdims=True) + 1e-9\n",
        "        x_norm = (x_np - self.scaler_mu)/self.scaler_sig\n",
        "\n",
        "        feats, targets = [], []\n",
        "        for t in range(k, len(x_norm)):\n",
        "            window = x_norm[t-k:t]              # shape (k,3)\n",
        "            feats.append(self._build_feature(window))\n",
        "            targets.append(y_np[t])\n",
        "\n",
        "        X = np.vstack(feats)\n",
        "        Y = np.vstack(targets)\n",
        "        self.reg.fit(X, Y)\n",
        "\n",
        "    # ---------------------------------------------------------\n",
        "    def predict(self, init_window: np.ndarray, n_steps: int):\n",
        "        \"\"\"\n",
        "        Autoregressive roll-out.\n",
        "        init_window : array (k,3)  – most recent k inputs (y-values).\n",
        "        Returns array (n_steps,3)\n",
        "        \"\"\"\n",
        "        k = self.k\n",
        "        window = init_window.copy()\n",
        "        preds  = np.empty((n_steps, 3), dtype=np.float32)\n",
        "\n",
        "        for t in range(n_steps):\n",
        "            w_norm  = (window - self.scaler_mu)/self.scaler_sig\n",
        "            phi     = self._build_feature(w_norm)\n",
        "            y_hat   = self.reg.predict(phi[None, :])[0]\n",
        "            preds[t] = y_hat\n",
        "            # slide window: drop oldest, append new prediction\n",
        "            window = np.vstack([window[1:], y_hat])\n",
        "\n",
        "        return preds\n",
        "\n",
        "    def predict_open_loop(self, input_sequence: np.ndarray) -> np.ndarray:\n",
        "        \"\"\"\n",
        "        Open-loop (teacher-forced) prediction using true inputs.\n",
        "\n",
        "        Parameters:\n",
        "        - input_sequence: np.ndarray of shape (T, 3), full sequence of inputs.\n",
        "\n",
        "        Returns:\n",
        "        - preds: np.ndarray of shape (T - k, 3), predicted outputs using true inputs.\n",
        "        \"\"\"\n",
        "        k = self.k\n",
        "        x_norm = (input_sequence - self.scaler_mu) / self.scaler_sig\n",
        "        preds = []\n",
        "\n",
        "        for t in range(k, len(x_norm)):\n",
        "            window = x_norm[t-k:t]  # shape (k, 3)\n",
        "            phi = self._build_feature(window)\n",
        "            y_hat = self.reg.predict(phi[None, :])[0]\n",
        "            preds.append(y_hat)\n",
        "\n",
        "        return np.vstack(preds)"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "0244cf3c",
      "metadata": {
        "id": "0244cf3c"
      },
      "source": [
        "## Transformer"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "2de6c475",
      "metadata": {
        "id": "2de6c475"
      },
      "outputs": [],
      "source": [
        "class SmallCausalTransformer3D(nn.Module):\n",
        "    \"\"\"\n",
        "    Single-layer causal Transformer:\n",
        "      • d_model = 24,   nhead = 1,   d_ff = 4·d_model\n",
        "      • receptive field  = sequence length L (set in fit / predict)\n",
        "    \"\"\"\n",
        "    def _init_(self,\n",
        "                 d_model: int = 24,\n",
        "                 nhead: int = 1,\n",
        "                 d_ff: int = 96,        # 4 × d_model\n",
        "                 lr: float = 2e-3,\n",
        "                 epochs: int = 60,\n",
        "                 device: str = \"cpu\",\n",
        "                 seed: int = 0):\n",
        "        super()._init_()\n",
        "        torch.manual_seed(seed); np.random.seed(seed)\n",
        "        self.device, self.epochs = device, epochs\n",
        "\n",
        "        self.in_proj   = nn.Linear(3, d_model)     # 3-dim input → tokens\n",
        "        encoder_layer  = nn.TransformerEncoderLayer(\n",
        "                             d_model=d_model,\n",
        "                             nhead=nhead,\n",
        "                             dim_feedforward=d_ff,\n",
        "                             batch_first=True,\n",
        "                             activation=\"gelu\",\n",
        "                             norm_first=True)\n",
        "        self.encoder   = nn.TransformerEncoder(encoder_layer, num_layers=1)\n",
        "        self.pos_embed = None                      # built on first call\n",
        "        self.head      = nn.Linear(d_model, 3)     # back to 3-dim output\n",
        "\n",
        "        self.to(device)\n",
        "        self.opt  = Adam(self.parameters(), lr=lr)\n",
        "        self.crit = nn.MSELoss()\n",
        "\n",
        "    # ----------------------------------------\n",
        "    def _get_posembed(self, L: int, d: int):\n",
        "        \"\"\"Fixed sinusoidal positional embedding (same as Vaswani et al.).\"\"\"\n",
        "        pos = torch.arange(L, dtype=torch.float32, device=self.device)\n",
        "        i   = torch.arange(d//2, dtype=torch.float32, device=self.device)\n",
        "        angles = pos[:, None] / (10000 ** (2*i/d))\n",
        "        pe = torch.zeros(L, d, device=self.device)\n",
        "        pe[:, 0::2] = torch.sin(angles)\n",
        "        pe[:, 1::2] = torch.cos(angles)\n",
        "        return pe[None]                                # shape (1,L,d)\n",
        "\n",
        "    # ----------------------------------------\n",
        "    def total_parameters(self):\n",
        "        return sum(p.numel() for p in self.parameters() if p.requires_grad)\n",
        "\n",
        "\n",
        "    def fit(self, x_np: np.ndarray, y_np: np.ndarray, L: int = 20):\n",
        "        \"\"\"\n",
        "        Teacher-forcing with sliding windows of length L.\n",
        "        x_np, y_np  shape [T, 3];  y_np[t] is the desired prediction for x_np[t].\n",
        "        \"\"\"\n",
        "        x = torch.tensor(x_np, dtype=torch.float32, device=self.device)\n",
        "        y = torch.tensor(y_np, dtype=torch.float32, device=self.device)\n",
        "\n",
        "        if self.pos_embed is None or self.pos_embed.size(1) != L:\n",
        "            self.pos_embed = self._get_posembed(L, self.in_proj.out_features)\n",
        "\n",
        "        # build training batches as overlapping windows (stride 1)\n",
        "        windows   = x.unfold(0, L, 1)        # shape [T-L+1, L, 3]\n",
        "        windows = windows.permute(0, 2, 1)  # (1981, 20, 3)\n",
        "        targets   = y[L-1:]                  # predict the last step\n",
        "        dataset   = torch.utils.data.TensorDataset(windows, targets)\n",
        "        loader    = torch.utils.data.DataLoader(dataset,\n",
        "                                                batch_size=64,\n",
        "                                                shuffle=True)\n",
        "\n",
        "        for _ in range(self.epochs):\n",
        "            for batch_x, batch_y in loader:\n",
        "                self.opt.zero_grad()\n",
        "                z   = self.in_proj(batch_x) + self.pos_embed\n",
        "                out = self.encoder(z)\n",
        "                pred = self.head(out[:, -1])          # last token\n",
        "                loss = self.crit(pred, batch_y)\n",
        "                loss.backward(); self.opt.step()\n",
        "\n",
        "    # ----------------------------------------\n",
        "    @torch.no_grad()\n",
        "    def predict(self, init_window: np.ndarray, n_steps: int):\n",
        "        \"\"\"\n",
        "        Autoregressive roll-out.\n",
        "        init_window : numpy (L,3)  – most recent L samples (old → new)\n",
        "        Returns      : numpy (n_steps,3)\n",
        "        \"\"\"\n",
        "        L = init_window.shape[0]\n",
        "        if self.pos_embed is None or self.pos_embed.size(1) != L:\n",
        "            self.pos_embed = self._get_posembed(L, self.in_proj.out_features)\n",
        "\n",
        "        window = torch.tensor(init_window, dtype=torch.float32,\n",
        "                              device=self.device)\n",
        "        preds  = np.empty((n_steps, 3), dtype=np.float32)\n",
        "\n",
        "        for t in range(n_steps):\n",
        "            z   = self.in_proj(window[None]) + self.pos_embed\n",
        "            y   = self.head(self.encoder(z)[:, -1])[0]\n",
        "            preds[t] = y.cpu().detach().numpy()\n",
        "\n",
        "            window = torch.vstack([window[1:], y])\n",
        "\n",
        "        return preds\n",
        "\n",
        "    def predict_open_loop(self, x_np: np.ndarray):\n",
        "        \"\"\"\n",
        "        Autoregressive roll-out.\n",
        "        init_window : numpy (L,3)  – most recent L samples (old → new)\n",
        "        Returns      : numpy (n_steps,3)\n",
        "        \"\"\"\n",
        "        L = x_np[0].shape[0]\n",
        "        if self.pos_embed is None or self.pos_embed.size(1) != L:\n",
        "            self.pos_embed = self._get_posembed(L, self.in_proj.out_features)\n",
        "\n",
        "        # window = torch.tensor(init_window, dtype=torch.float32,\n",
        "        #                       device=self.device)\n",
        "        preds  = np.empty((len(x_np), 3), dtype=np.float32)\n",
        "\n",
        "        for t in x_np:\n",
        "            t = torch.tensor(t, dtype=torch.float32, device=self.device)\n",
        "            z   = self.in_proj(t) + self.pos_embed\n",
        "            y   = self.head(self.encoder(z)[:, -1])[0]\n",
        "            preds[t] = y.cpu().detach().numpy()\n",
        "        return preds"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "4e7e8f1e",
      "metadata": {
        "id": "4e7e8f1e"
      },
      "source": [
        "## TCN"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "ab5c2f0a",
      "metadata": {
        "id": "ab5c2f0a"
      },
      "outputs": [],
      "source": [
        "class TCNBaseline3D(nn.Module):\n",
        "    \"\"\"\n",
        "    2-layer causal TCN       (kernel=3, dilation=1 & 2, padding chosen\n",
        "    so receptive field = 5 time-steps, identical to NVAR window length).\n",
        "    ----------------------\n",
        "    • input_dim  = 3\n",
        "    • hidden_dim = 32  \n",
        "    • output_dim = 3    (one-step prediction)\n",
        "    \"\"\"\n",
        "    def _init_(self,\n",
        "                 input_dim:  int = 3,\n",
        "                 hidden_dim: int = 32,\n",
        "                 output_dim: int = 3,\n",
        "                 lr: float = 1e-3,\n",
        "                 epochs: int = 40,\n",
        "                 device: str = \"cpu\",\n",
        "                 seed: int = 0):\n",
        "        super()._init_()\n",
        "        torch.manual_seed(seed); np.random.seed(seed)\n",
        "\n",
        "        k = 3  # kernel\n",
        "        # layer 1: dilation 1  → pad 2 to keep length\n",
        "        self.conv1 = nn.Conv1d(input_dim, hidden_dim,\n",
        "                               kernel_size=k,\n",
        "                               dilation=1,\n",
        "                               padding=2,\n",
        "                               bias=True)\n",
        "        # layer 2: dilation 2  → pad 4\n",
        "        self.conv2 = nn.Conv1d(hidden_dim, hidden_dim,\n",
        "                               kernel_size=k,\n",
        "                               dilation=2,\n",
        "                               padding=4,\n",
        "                               bias=True)\n",
        "        self.relu  = nn.ReLU()\n",
        "        self.head  = nn.Conv1d(hidden_dim, output_dim,\n",
        "                               kernel_size=1, bias=True)\n",
        "\n",
        "        self.lr, self.epochs = lr, epochs\n",
        "        self.to(device)\n",
        "        self.optim = Adam(self.parameters(), lr=lr)\n",
        "        self.crit  = nn.MSELoss()\n",
        "\n",
        "    # ---------------------------------------------------------\n",
        "    def forward(self, x):\n",
        "        \"\"\"\n",
        "        x shape  [B, T, 3]  (batch, time, channels)\n",
        "        return  [B, T, 3]\n",
        "        \"\"\"\n",
        "        # reshape to Conv1d convention: (B, C, T)\n",
        "        x = x.permute(0, 2, 1)\n",
        "        y = self.conv1(x); y = self.relu(y[:, :, :-2])     # remove look-ahead pad\n",
        "        y = self.conv2(y); y = self.relu(y[:, :, :-4])     # remove look-ahead pad\n",
        "        out = self.head(y).permute(0, 2, 1)                # back to (B,T,C)\n",
        "        return out\n",
        "\n",
        "    # ---------------------------------------------------------\n",
        "    def total_parameters(self):\n",
        "        return sum(p.numel() for p in self.parameters() if p.requires_grad)\n",
        "\n",
        "    def fit(self, x_np: np.ndarray, y_np: np.ndarray):\n",
        "        \"\"\"\n",
        "        Teacher-forcing on entire sequence (batch size = 1).\n",
        "        x_np, y_np shape [T, 3]\n",
        "        \"\"\"\n",
        "        x = torch.tensor(x_np[None], dtype=torch.float32, device=next(self.parameters()).device)\n",
        "        y = torch.tensor(y_np[None], dtype=torch.float32, device=next(self.parameters()).device)\n",
        "\n",
        "        for _ in range(self.epochs):\n",
        "            self.optim.zero_grad()\n",
        "            pred = self.forward(x)\n",
        "            loss = self.crit(pred[:, :-1], y[:, 1:])  # predict next step\n",
        "            loss.backward()\n",
        "            self.optim.step()\n",
        "\n",
        "    # ---------------------------------------------------------\n",
        "    @torch.no_grad()\n",
        "    def predict(self, init_window: np.ndarray, n_steps: int):\n",
        "        \"\"\"\n",
        "        Autoregressive roll-out.\n",
        "        init_window : length L≥5, shape [L,3] (latest samples, earliest first)\n",
        "        Returns      : [n_steps,3]\n",
        "        \"\"\"\n",
        "        device = next(self.parameters()).device\n",
        "        window = init_window.copy()\n",
        "        preds  = np.empty((n_steps, 3), dtype=np.float32)\n",
        "\n",
        "        for t in range(n_steps):\n",
        "            inp = torch.tensor(window[None], dtype=torch.float32, device=device)\n",
        "            y   = self.forward(inp)[0, -1].cpu().detach().numpy()\n",
        "            preds[t] = y\n",
        "            window   = np.vstack([window[1:], y])  # slide window\n",
        "\n",
        "        return preds\n",
        "\n",
        "    def predict_open_loop(self, x_np: np.ndarray):\n",
        "        \"\"\"\n",
        "        Open-loop prediction (teacher-forced inputs).\n",
        "        x_np shape: [T, 3]\n",
        "        Returns:\n",
        "            preds: [T - 1, 3] – one-step-ahead predictions\n",
        "        \"\"\"\n",
        "        self.eval()\n",
        "        device = next(self.parameters()).device\n",
        "\n",
        "        x = torch.tensor(x_np[None], dtype=torch.float32, device=device)  # [1, T, 3]\n",
        "        preds = self.forward(x)  # [1, T, 3]\n",
        "        preds = preds[:, :-1]    # predict from t=0 to t=T-2 for target t=1 to t=T-1\n",
        "\n",
        "        return preds.squeeze(0).cpu().detach().numpy()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "caf03d56",
      "metadata": {
        "id": "caf03d56"
      },
      "source": [
        "## MIT-BIH"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "388ad52e",
      "metadata": {
        "id": "388ad52e"
      },
      "outputs": [],
      "source": [
        "import wfdb\n",
        "\n",
        "# Download and load record and annotations for patient #100\n",
        "record = wfdb.rdrecord('100', sampfrom=0, sampto=25002, pn_dir='mitdb')  # first 20,000 samples\n",
        "annotation = wfdb.rdann('100', 'atr', sampfrom=0, sampto=25002, pn_dir='mitdb')\n",
        "# Get input signal u(t) from the first channel\n",
        "u = record.p_signal[:, 0]\n",
        "u\n",
        "# Normalize input\n",
        "u_min = np.min(u)\n",
        "u_max = np.max(u)\n",
        "u_norm = (u - u_min) / (u_max - u_min)\n",
        "fs = record.fs  # sampling frequency (should be 360 Hz)\n",
        "t_vals = np.arange(len(u_norm)) / fs\n",
        "emb_dim = 3\n",
        "# inputs = u_norm\n",
        "inputs = create_delay_embedding(u_norm, emb_dim)\n",
        "\n",
        "# Create target array (heartbeat locations)\n",
        "targets = np.zeros(len(u_norm))\n",
        "targets[annotation.sample] = 1  # mark annotations as 1 (heartbeat)\n",
        "targets = create_delay_embedding(targets, emb_dim)\n",
        "data_size = len(inputs)\n",
        "train_size = 15000\n",
        "train_input = inputs[:train_size]\n",
        "train_target = targets[:train_size]\n",
        "test_input = inputs[train_size+1:]\n",
        "test_target = targets[train_size+1:]\n",
        "test_size = len(test_input)\n",
        "print(f\"Total samples: {data_size}, train size: {train_size}, test size: {test_size}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "a7c77f51",
      "metadata": {
        "id": "a7c77f51"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "seeds = range(995, 1025)\n",
        "\n",
        "k = 100\n",
        "\n",
        "for seed in seeds:\n",
        "    # NVAR\n",
        "    nvar = NVARBaseline3D(k=k, ridge_alpha=1e-4)\n",
        "    nvar.fit(train_input, train_target)\n",
        "    print(nvar.total_parameters())\n",
        "    nvar_preds = nvar.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(nvar_preds, test_target, all_horizons)\n",
        "    nrmse_dict['NVAR'].append(nrmse)\n",
        "\n",
        "    # LSTM\n",
        "    lstm_baseline = LSTMBaseline3D(hidden_size=500, lr=1e-3, epochs=80, device='cuda' if torch.cuda.is_available() else 'cpu', seed=seed)\n",
        "    print(lstm_baseline.total_parameters())\n",
        "    lstm_baseline.fit(train_input, train_target)\n",
        "    # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "    init_vec = train_target[-1]                # last teacher-forced target\n",
        "    lstm_preds = lstm_baseline.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(lstm_preds, test_target, all_horizons)\n",
        "    nrmse_dict['LSTM'].append(nrmse)\n",
        "\n",
        "    tcn_baseline = TCNBaseline3D(hidden_dim=600, lr=1e-3, epochs=85, device='cuda' if torch.cuda.is_available() else 'cpu', seed=seed)\n",
        "    print(tcn_baseline.total_parameters())\n",
        "    tcn_baseline.fit(train_input, train_target)\n",
        "    # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "    init_vec = train_target[-1]                # last teacher-forced target\n",
        "    tcn_preds = tcn_baseline.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(tcn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['TCN'].append(nrmse)\n",
        "\n",
        "    transformer_baseline = SmallCausalTransformer3D(d_model= 100,nhead = 1,d_ff = 400,lr=1e-3,epochs=90,device='cuda' if torch.cuda.is_available() else 'cpu',seed=seed)\n",
        "    print(transformer_baseline.total_parameters())\n",
        "    transformer_baseline.fit(train_input, train_target)\n",
        "    # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "    init_vec = train_target[-1]                # last teacher-forced target\n",
        "    transformer_preds = transformer_baseline.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(transformer_preds, test_target, all_horizons)\n",
        "    nrmse_dict['Transformer'].append(nrmse)\n",
        "\n",
        "\n",
        "horizons = [300, 600, 1000]\n",
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'NVAR':<17} {'LSTM':<17} {'Transformer':<17} {'TCN':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "for horizon in horizons:\n",
        "    nvar_vals = [np.mean(nvar_nrmse[horizon]) for nvar_nrmse in nrmse_dict['NVAR']]\n",
        "    lstm_vals = [np.mean(lstm_nrmse[horizon]) for lstm_nrmse in nrmse_dict['LSTM']]\n",
        "    tfmr_vals = [np.mean(tfmr_nrmse[horizon]) for tfmr_nrmse in nrmse_dict['TFMR']]\n",
        "    tcn_vals = [np.mean(tcn_nrmse[horizon]) for tcn_nrmse in nrmse_dict['TCN']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [nvar_vals, lstm_vals, tfmr_vals, tcn_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean} ± {std}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "4dc79e4b",
      "metadata": {
        "id": "4dc79e4b"
      },
      "source": [
        "## Sunspot"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "e9246aef",
      "metadata": {
        "id": "e9246aef"
      },
      "outputs": [],
      "source": [
        "import pandas as pd\n",
        "file_path = 'dataset/SN_m_tot_V2.0.csv'\n",
        "\n",
        "df = pd.read_csv(file_path, sep=';', header = None)\n",
        "df\n",
        "data = df.iloc[:, 3].values\n",
        "dt = 1\n",
        "dataset_size = len(data)\n",
        "data = create_delay_embedding(data, 3)\n",
        "print(f\"Dataset size: {dataset_size}\")\n",
        "\n",
        "# Train/Test Split\n",
        "train_end = 2000\n",
        "train_input  = data[:train_end]\n",
        "train_target = data[1:train_end+1]\n",
        "test_input   = data[train_end:-1]\n",
        "test_target  = data[train_end+1:]\n",
        "y_test = test_target\n",
        "n_test_steps = len(test_target)\n",
        "time_test = np.arange(n_test_steps) * dt\n",
        "\n",
        "print(f\"Train size: {len(train_input)}\\nTest size: {len(test_input)}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "84a28e3e",
      "metadata": {
        "id": "84a28e3e"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "seeds = range(995, 1025)\n",
        "\n",
        "k = 100\n",
        "\n",
        "for seed in seeds:\n",
        "    # NVAR\n",
        "    nvar = NVARBaseline3D(k=k, ridge_alpha=1e-4)\n",
        "    nvar.fit(train_input, train_target)\n",
        "    print(nvar.total_parameters())\n",
        "    nvar_preds = nvar.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(nvar_preds, test_target, all_horizons)\n",
        "    nrmse_dict['NVAR'].append(nrmse)\n",
        "\n",
        "    # LSTM\n",
        "    lstm_baseline = LSTMBaseline3D(hidden_size=1000, lr=1e-3, epochs=200, device='cuda' if torch.cuda.is_available() else 'cpu', seed=seed)\n",
        "    print(lstm_baseline.total_parameters())\n",
        "    lstm_baseline.fit(train_input, train_target)\n",
        "    # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "    init_vec = train_target[-1]                # last teacher-forced target\n",
        "    lstm_preds = lstm_baseline.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(lstm_preds, test_target, all_horizons)\n",
        "    nrmse_dict['LSTM'].append(nrmse)\n",
        "\n",
        "    tcn_baseline = TCNBaseline3D(hidden_dim=400,lr=1e-3,epochs=70,device='cuda' if torch.cuda.is_available() else 'cpu',seed=seed)\n",
        "    print(tcn_baseline.total_parameters())\n",
        "    tcn_baseline.fit(train_input, train_target)\n",
        "    # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "    init_vec = train_target[-1]                # last teacher-forced target\n",
        "    tcn_preds = tcn_baseline.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(tcn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['TCN'].append(nrmse)\n",
        "\n",
        "    transformer_baseline = SmallCausalTransformer3D(d_model= 80,nhead = 1,d_ff = 320,lr=1e-3,epochs=65,device='cuda' if torch.cuda.is_available() else 'cpu',seed=seed)\n",
        "    print(transformer_baseline.total_parameters())\n",
        "    transformer_baseline.fit(train_input, train_target)\n",
        "    # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "    init_vec = train_target[-1]                # last teacher-forced target\n",
        "    transformer_preds = transformer_baseline.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(transformer_preds, test_target, all_horizons)\n",
        "    nrmse_dict['Transformer'].append(nrmse)\n",
        "\n",
        "\n",
        "horizons = [300, 600, 1000]\n",
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'NVAR':<17} {'LSTM':<17} {'Transformer':<17} {'TCN':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "for horizon in horizons:\n",
        "    nvar_vals = [np.mean(nvar_nrmse[horizon]) for nvar_nrmse in nrmse_dict['NVAR']]\n",
        "    lstm_vals = [np.mean(lstm_nrmse[horizon]) for lstm_nrmse in nrmse_dict['LSTM']]\n",
        "    tfmr_vals = [np.mean(tfmr_nrmse[horizon]) for tfmr_nrmse in nrmse_dict['TFMR']]\n",
        "    tcn_vals = [np.mean(tcn_nrmse[horizon]) for tcn_nrmse in nrmse_dict['TCN']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [nvar_vals, lstm_vals, tfmr_vals, tcn_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean} ± {std}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "06001aca",
      "metadata": {
        "id": "06001aca"
      },
      "source": [
        "## Santa Fe"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "d19fa9f5",
      "metadata": {
        "id": "d19fa9f5"
      },
      "outputs": [],
      "source": [
        "import pandas as pd\n",
        "\n",
        "file_path = 'dataset/santa-fe-time-series/b1.txt'\n",
        "\n",
        "df = pd.read_csv(file_path, header=None, sep=' ')\n",
        "df\n",
        "# Normalize the first column (column 0) of the DataFrame\n",
        "df[0] = (df[0] - df[0].min()) / (df[0].max() - df[0].min())\n",
        "data = df.iloc[:, 0].values\n",
        "chosen_system = \"SantaFe\"\n",
        "dt = 1\n",
        "T_data = len(data)\n",
        "data = create_delay_embedding(data, 3)\n",
        "print(f\"Data length: {T_data}.\")\n",
        "\n",
        "# Train/Test Split\n",
        "train_end = 7000\n",
        "train_input  = data[:train_end]\n",
        "train_target = data[1:train_end+1]\n",
        "test_input   = data[train_end:-1]\n",
        "test_target  = data[train_end+1:]\n",
        "y_test = test_target\n",
        "n_test_steps = len(test_target)\n",
        "time_test = np.arange(n_test_steps) * dt\n",
        "\n",
        "print(f\"Train size: {len(train_input)}  \\nTest size: {len(test_input)}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "662a21e3",
      "metadata": {
        "id": "662a21e3"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "seeds = range(995, 1025)\n",
        "\n",
        "k = 100\n",
        "\n",
        "for seed in seeds:\n",
        "    # NVAR\n",
        "    nvar = NVARBaseline3D(k=k, ridge_alpha=1e-4)\n",
        "    nvar.fit(train_input, train_target)\n",
        "    print(nvar.total_parameters())\n",
        "    nvar_preds = nvar.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(nvar_preds, test_target, all_horizons)\n",
        "    nrmse_dict['NVAR'].append(nrmse)\n",
        "\n",
        "    # LSTM\n",
        "    lstm_baseline = LSTMBaseline3D(hidden_size=500, lr=1e-3, epochs=80, device='cuda' if torch.cuda.is_available() else 'cpu', seed=seed)\n",
        "    print(lstm_baseline.total_parameters())\n",
        "    lstm_baseline.fit(train_input, train_target)\n",
        "    # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "    init_vec = train_target[-1]                # last teacher-forced target\n",
        "    lstm_preds = lstm_baseline.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(lstm_preds, test_target, all_horizons)\n",
        "    nrmse_dict['LSTM'].append(nrmse)\n",
        "\n",
        "    tcn_baseline = TCNBaseline3D(hidden_dim=500,lr=1e-3,epochs=85,device='cuda' if torch.cuda.is_available() else 'cpu',seed=seed)\n",
        "    print(tcn_baseline.total_parameters())\n",
        "    tcn_baseline.fit(train_input, train_target)\n",
        "    # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "    init_vec = train_target[-1]                # last teacher-forced target\n",
        "    tcn_preds = tcn_baseline.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(tcn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['TCN'].append(nrmse)\n",
        "\n",
        "    transformer_baseline = SmallCausalTransformer3D(d_model= 100,nhead = 1,d_ff = 400,lr=1e-3,epochs=100,device='cuda' if torch.cuda.is_available() else 'cpu',seed=seed)\n",
        "    print(transformer_baseline.total_parameters())\n",
        "    transformer_baseline.fit(train_input, train_target)\n",
        "    # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "    init_vec = train_target[-1]                # last teacher-forced target\n",
        "    transformer_preds = transformer_baseline.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(transformer_preds, test_target, all_horizons)\n",
        "    nrmse_dict['Transformer'].append(nrmse)\n",
        "\n",
        "\n",
        "horizons = [300, 600, 1000]\n",
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'NVAR':<17} {'LSTM':<17} {'Transformer':<17} {'TCN':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "for horizon in horizons:\n",
        "    nvar_vals = [np.mean(nvar_nrmse[horizon]) for nvar_nrmse in nrmse_dict['NVAR']]\n",
        "    lstm_vals = [np.mean(lstm_nrmse[horizon]) for lstm_nrmse in nrmse_dict['LSTM']]\n",
        "    tfmr_vals = [np.mean(tfmr_nrmse[horizon]) for tfmr_nrmse in nrmse_dict['TFMR']]\n",
        "    tcn_vals = [np.mean(tcn_nrmse[horizon]) for tcn_nrmse in nrmse_dict['TCN']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [nvar_vals, lstm_vals, tfmr_vals, tcn_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean} ± {std}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "d6bdb6ae",
      "metadata": {
        "id": "d6bdb6ae"
      },
      "source": [
        "## BIDMC"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "b2faac0c",
      "metadata": {
        "id": "b2faac0c"
      },
      "outputs": [],
      "source": [
        "# ─── Load BIDMC Record ─────────────────────────────────────────────────────\n",
        "record_id = 'bidmc01'\n",
        "record = wfdb.rdrecord(record_id, pn_dir='bidmc', sampto=8 * 60 * 125)  # 8 mins at 125Hz\n",
        "signals = record.p_signal  # shape: (60000, 5)\n",
        "names = [n.strip().strip(',') for n in record.sig_name]\n",
        "# ─── Get Indices of ECG Lead II and RESP ──────────────────────────────────\n",
        "idx_ecg = names.index('II')     # ECG Lead II\n",
        "idx_resp = names.index('RESP')  # Respiration signal\n",
        "# ─── Parameters ────────────────────────────────────────────────────────────\n",
        "N_train = 10000\n",
        "N_test = 5000\n",
        "emb_dim = 3\n",
        "# ─── Select Signals ────────────────────────────────────────────────────────\n",
        "u = signals[:, idx_ecg]   # input: ECG Lead II\n",
        "v = signals[:, idx_resp]  # target: RESP\n",
        "# ─── Normalize to [-1, 1] ──────────────────────────────────────────────────\n",
        "u_norm = 2 * (u - np.min(u)) / (np.max(u) - np.min(u)) - 1\n",
        "v_norm = 2 * (v - np.min(v)) / (np.max(v) - np.min(v)) - 1\n",
        "# ─── Delay Embedding ───────────────────────────────────────────────────────\n",
        "inputs = create_delay_embedding(u_norm, emb_dim)\n",
        "targets = create_delay_embedding(v_norm, emb_dim)\n",
        "# ─── Train/Test Split ──────────────────────────────────────────────────────\n",
        "train_input = inputs[:N_train]\n",
        "train_target = targets[:N_train]\n",
        "test_input = inputs[N_train:N_train+N_test]\n",
        "test_target = targets[N_train:N_train+N_test]\n",
        "# ─── Summary ───────────────────────────────────────────────────────────────\n",
        "print(f\"Train input shape:  {train_input.shape}\")\n",
        "print(f\"Train target shape: {train_target.shape}\")\n",
        "print(f\"Test input shape:   {test_input.shape}\")\n",
        "print(f\"Test target shape:  {test_target.shape}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "831278b0",
      "metadata": {
        "id": "831278b0"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "seeds = range(995, 1025)\n",
        "\n",
        "k = 100\n",
        "\n",
        "for seed in seeds:\n",
        "    # NVAR\n",
        "    nvar = NVARBaseline3D(k=k, ridge_alpha=1e-4)\n",
        "    nvar.fit(train_input, train_target)\n",
        "    print(nvar.total_parameters())\n",
        "    nvar_preds = nvar.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(nvar_preds, test_target, all_horizons)\n",
        "    nrmse_dict['NVAR'].append(nrmse)\n",
        "\n",
        "    # LSTM\n",
        "    lstm_baseline = LSTMBaseline3D(hidden_size=500, lr=1e-3, epochs=80, device='cuda' if torch.cuda.is_available() else 'cpu', seed=seed)\n",
        "    print(lstm_baseline.total_parameters())\n",
        "    lstm_baseline.fit(train_input, train_target)\n",
        "    # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "    init_vec = train_target[-1]                # last teacher-forced target\n",
        "    lstm_preds = lstm_baseline.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(lstm_preds, test_target, all_horizons)\n",
        "    nrmse_dict['LSTM'].append(nrmse)\n",
        "\n",
        "    tcn_baseline = TCNBaseline3D(hidden_dim=800,lr=1e-3,epochs=120,device='cuda' if torch.cuda.is_available() else 'cpu',seed=seed)\n",
        "    print(tcn_baseline.total_parameters())\n",
        "    tcn_baseline.fit(train_input, train_target)\n",
        "    # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "    init_vec = train_target[-1]                # last teacher-forced target\n",
        "    tcn_preds = tcn_baseline.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(tcn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['TCN'].append(nrmse)\n",
        "\n",
        "    transformer_baseline = SmallCausalTransformer3D(d_model= 80,nhead = 2,d_ff = 320,lr=1e-3,epochs=120,device='cuda' if torch.cuda.is_available() else 'cpu',seed=seed)\n",
        "    print(transformer_baseline.total_parameters())\n",
        "    transformer_baseline.fit(train_input, train_target)\n",
        "    # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "    init_vec = train_target[-1]                # last teacher-forced target\n",
        "    transformer_preds = transformer_baseline.predict_open_loop(test_input)\n",
        "    nrmse = evaluate_nrmse(transformer_preds, test_target, all_horizons)\n",
        "    nrmse_dict['Transformer'].append(nrmse)\n",
        "\n",
        "\n",
        "horizons = [300, 600, 1000]\n",
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'NVAR':<17} {'LSTM':<17} {'Transformer':<17} {'TCN':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "for horizon in horizons:\n",
        "    nvar_vals = [np.mean(nvar_nrmse[horizon]) for nvar_nrmse in nrmse_dict['NVAR']]\n",
        "    lstm_vals = [np.mean(lstm_nrmse[horizon]) for lstm_nrmse in nrmse_dict['LSTM']]\n",
        "    tfmr_vals = [np.mean(tfmr_nrmse[horizon]) for tfmr_nrmse in nrmse_dict['TFMR']]\n",
        "    tcn_vals = [np.mean(tcn_nrmse[horizon]) for tcn_nrmse in nrmse_dict['TCN']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [nvar_vals, lstm_vals, tfmr_vals, tcn_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean} ± {std}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "780d1a7b",
      "metadata": {
        "id": "780d1a7b"
      },
      "source": [
        "## Canonical Benchmarks"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "8572e01b",
      "metadata": {
        "id": "8572e01b"
      },
      "source": [
        "#### Lorenz"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "d0878bdb",
      "metadata": {
        "id": "d0878bdb"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [200, 400, 600, 800, 1000]\n",
        "initial_input = test_input[0]\n",
        "num_steps = len(test_input)\n",
        "lle_lorenz = 0.9\n",
        "lyapunov_time_lorenz = 1.0 / lle_lorenz\n",
        "lyapunov_time = lyapunov_time_lorenz\n",
        "VPT_threshold = 0.4\n",
        "test_time = np.arange(test_size)*dt\n",
        "seeds = range(1, 6)\n",
        "train_fracs = [0.7,0.75,0.8]\n",
        "initial_states = [[1.0, 1.0, 1.0], [1.0, 2.0, 3.0], [2.0, 1.5, 4.0]]\n",
        "tmax = 250\n",
        "dt = 0.02\n",
        "\n",
        "nrmse_dict = defaultdict(list)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "cb27eefb",
      "metadata": {
        "id": "cb27eefb"
      },
      "outputs": [],
      "source": [
        "for initial_state in initial_states:\n",
        "    t_vals, lorenz_traj = generate_lorenz_data(\n",
        "    initial_state=initial_state,\n",
        "    tmax=tmax,\n",
        "    dt=dt\n",
        "    )\n",
        "\n",
        "    washout = 2000\n",
        "    t_vals = t_vals[washout:]\n",
        "    lorenz_traj = lorenz_traj[washout:]\n",
        "\n",
        "    scaler = MinMaxScaler()\n",
        "    scaler.fit(lorenz_traj)\n",
        "    lorenz_traj = scaler.transform(lorenz_traj)\n",
        "    T_data = len(lorenz_traj)\n",
        "\n",
        "    for train_frac in train_fracs:\n",
        "        train_end = int(train_frac * (T_data - 1))\n",
        "        train_input = lorenz_traj[:train_end]\n",
        "        train_target = lorenz_traj[1:train_end + 1]\n",
        "        test_input = lorenz_traj[train_end:-1]\n",
        "        test_target = lorenz_traj[train_end + 1:]\n",
        "        n_test_steps = len(test_input)\n",
        "        initial_in = test_input[0]\n",
        "\n",
        "        for seed in seeds:\n",
        "            # NVAR\n",
        "            nvar = NVARBaseline3D(k=100, ridge_alpha=1e-4)\n",
        "            nvar.fit(train_input, train_target)\n",
        "            print(nvar.total_parameters())\n",
        "            nvar_preds = nvar.predict(initial_in, n_test_steps)\n",
        "            nrmse = evaluate_nrmse(nvar_preds, test_target, all_horizons)\n",
        "            nrmse_dict['NVAR'].append(nrmse)\n",
        "\n",
        "            # LSTM\n",
        "            lstm_baseline = LSTMBaseline3D(hidden_size=500, lr=1e-3, epochs=80, device='cuda' if torch.cuda.is_available() else 'cpu', seed=seed)\n",
        "            print(lstm_baseline.total_parameters())\n",
        "            lstm_baseline.fit(train_input, train_target)\n",
        "            # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "            init_vec = train_target[-1]\n",
        "            lstm_preds = lstm_baseline.predict(initial_in, n_test_steps)\n",
        "            nrmse = evaluate_nrmse(lstm_preds, test_target, all_horizons)\n",
        "            nrmse_dict['LSTM'].append(nrmse)\n",
        "\n",
        "            tcn_baseline = TCNBaseline3D(hidden_dim=1500,lr=1e-3,epochs=180,device='cuda' if torch.cuda.is_available() else 'cpu',seed=seed)\n",
        "            print(tcn_baseline.total_parameters())\n",
        "            tcn_baseline.fit(train_input, train_target)\n",
        "            # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "            init_vec = train_target[-1]\n",
        "            tcn_preds = tcn_baseline.predict(initial_in, n_test_steps)\n",
        "            nrmse = evaluate_nrmse(tcn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['TCN'].append(nrmse)\n",
        "\n",
        "            transformer_baseline = SmallCausalTransformer3D(d_model= 200,nhead = 2,d_ff = 800,lr=1e-3,epochs=100,device='cuda' if torch.cuda.is_available() else 'cpu',seed=seed)\n",
        "            print(transformer_baseline.total_parameters())\n",
        "            transformer_baseline.fit(train_input, train_target)\n",
        "            # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "            init_vec = train_target[-1]\n",
        "            transformer_preds = transformer_baseline.predict(initial_in, n_test_steps)\n",
        "            nrmse = evaluate_nrmse(transformer_preds, test_target, all_horizons)\n",
        "            nrmse_dict['Transformer'].append(nrmse)\n",
        "\n",
        "\n",
        "horizons = [300, 600, 1000]\n",
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'NVAR':<17} {'LSTM':<17} {'Transformer':<17} {'TCN':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "for horizon in horizons:\n",
        "    nvar_vals = [np.mean(nvar_nrmse[horizon]) for nvar_nrmse in nrmse_dict['NVAR']]\n",
        "    lstm_vals = [np.mean(lstm_nrmse[horizon]) for lstm_nrmse in nrmse_dict['LSTM']]\n",
        "    tfmr_vals = [np.mean(tfmr_nrmse[horizon]) for tfmr_nrmse in nrmse_dict['TFMR']]\n",
        "    tcn_vals = [np.mean(tcn_nrmse[horizon]) for tcn_nrmse in nrmse_dict['TCN']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [nvar_vals, lstm_vals, tfmr_vals, tcn_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean} ± {std}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "c904d585",
      "metadata": {
        "id": "c904d585"
      },
      "source": [
        "#### Rossler"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "0214bfae",
      "metadata": {
        "id": "0214bfae"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [200, 400, 600, 800, 1000]\n",
        "initial_input = test_input[0]\n",
        "num_steps = len(test_input)\n",
        "lle_rossler = 0.071\n",
        "lyapunov_time_rossler = 1.0 / lle_rossler\n",
        "lyapunov_time = lyapunov_time_rossler\n",
        "VPT_threshold = 0.4\n",
        "test_time = np.arange(test_size)*dt\n",
        "seeds = range(1, 6)\n",
        "train_fracs = [0.3, 0.35, 0.4]\n",
        "initial_states = [[1.0, 1.0, 1.0], [1.0, 2.0, 3.0], [2.0, 1.5, 4.0]]\n",
        "tmax = 250\n",
        "dt = 0.02\n",
        "\n",
        "nrmse_dict = defaultdict(list)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "4f2e21c0",
      "metadata": {
        "id": "4f2e21c0"
      },
      "outputs": [],
      "source": [
        "for initial_state in initial_states:\n",
        "    t_vals, rossler_traj = generate_rossler_data(\n",
        "    initial_state=initial_state,\n",
        "    tmax=tmax,\n",
        "    dt=dt\n",
        "    )\n",
        "\n",
        "    washout = 2000\n",
        "    t_vals = t_vals[washout:]\n",
        "    rossler_traj = rossler_traj[washout:]\n",
        "\n",
        "    scaler = MinMaxScaler()\n",
        "    scaler.fit(rossler_traj)\n",
        "    rossler_traj = scaler.transform(rossler_traj)\n",
        "    T_data = len(rossler_traj)\n",
        "\n",
        "    for train_frac in train_fracs:\n",
        "        train_end = int(train_frac * (T_data - 1))\n",
        "        train_input = rossler_traj[:train_end]\n",
        "        train_target = rossler_traj[1:train_end + 1]\n",
        "        test_input = rossler_traj[train_end:-1]\n",
        "        test_target = rossler_traj[train_end + 1:]\n",
        "        n_test_steps = len(test_input)\n",
        "        initial_in = test_input[0]\n",
        "\n",
        "        for seed in seeds:\n",
        "            # NVAR\n",
        "            nvar = NVARBaseline3D(k=100, ridge_alpha=1e-4)\n",
        "            nvar.fit(train_input, train_target)\n",
        "            print(nvar.total_parameters())\n",
        "            nvar_preds = nvar.predict(initial_in, n_test_steps)\n",
        "            nrmse = evaluate_nrmse(nvar_preds, test_target, all_horizons)\n",
        "            nrmse_dict['NVAR'].append(nrmse)\n",
        "\n",
        "            # LSTM\n",
        "            lstm_baseline = LSTMBaseline3D(hidden_size=500, lr=1e-3, epochs=80, device='cuda' if torch.cuda.is_available() else 'cpu', seed=seed)\n",
        "            print(lstm_baseline.total_parameters())\n",
        "            lstm_baseline.fit(train_input, train_target)\n",
        "            # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "            init_vec = train_target[-1]                # last teacher-forced target\n",
        "            lstm_preds = lstm_baseline.predict(initial_in, n_test_steps)\n",
        "            nrmse = evaluate_nrmse(lstm_preds, test_target, all_horizons)\n",
        "            nrmse_dict['LSTM'].append(nrmse)\n",
        "\n",
        "            tcn_baseline = TCNBaseline3D(hidden_dim=800,lr=1e-3,epochs=150,device='cuda' if torch.cuda.is_available() else 'cpu',seed=seed)\n",
        "            print(tcn_baseline.total_parameters())\n",
        "            tcn_baseline.fit(train_input, train_target)\n",
        "            # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "            init_vec = train_target[-1]\n",
        "            tcn_preds = tcn_baseline.predict(initial_in, n_test_steps)\n",
        "            nrmse = evaluate_nrmse(tcn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['TCN'].append(nrmse)\n",
        "\n",
        "            transformer_baseline = SmallCausalTransformer3D(d_model= 200,nhead = 2,d_ff = 800,lr=1e-3,epochs=120,device='cuda' if torch.cuda.is_available() else 'cpu',seed=seed)\n",
        "            print(transformer_baseline.total_parameters())\n",
        "            transformer_baseline.fit(train_input, train_target)\n",
        "            # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "            init_vec = train_target[-1]\n",
        "            transformer_preds = transformer_baseline.predict(initial_in, n_test_steps)\n",
        "            nrmse = evaluate_nrmse(transformer_preds, test_target, all_horizons)\n",
        "            nrmse_dict['Transformer'].append(nrmse)\n",
        "\n",
        "\n",
        "horizons = [300, 600, 1000]\n",
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'NVAR':<17} {'LSTM':<17} {'Transformer':<17} {'TCN':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "for horizon in horizons:\n",
        "    nvar_vals = [np.mean(nvar_nrmse[horizon]) for nvar_nrmse in nrmse_dict['NVAR']]\n",
        "    lstm_vals = [np.mean(lstm_nrmse[horizon]) for lstm_nrmse in nrmse_dict['LSTM']]\n",
        "    tfmr_vals = [np.mean(tfmr_nrmse[horizon]) for tfmr_nrmse in nrmse_dict['TFMR']]\n",
        "    tcn_vals = [np.mean(tcn_nrmse[horizon]) for tcn_nrmse in nrmse_dict['TCN']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [nvar_vals, lstm_vals, tfmr_vals, tcn_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean} ± {std}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "c07f8416",
      "metadata": {
        "id": "c07f8416"
      },
      "source": [
        "#### Chen"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "6a3360db",
      "metadata": {
        "id": "6a3360db"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [200, 400, 600, 800, 1000]\n",
        "initial_input = test_input[0]\n",
        "num_steps = len(test_input)\n",
        "lle_chen = 0.829\n",
        "lyapunov_time_chen = 1.0 / lle_chen\n",
        "lyapunov_time = lyapunov_time_chen\n",
        "VPT_threshold = 0.4\n",
        "test_time = np.arange(test_size)*dt\n",
        "seeds = range(1, 6)\n",
        "train_fracs = [0.7, 0.75, 0.8]\n",
        "initial_states = [[1.0, 1.0, 1.0], [1.0, 2.0, 3.0], [2.0, 1.5, 4.0]]\n",
        "tmax = 250\n",
        "dt = 0.02\n",
        "\n",
        "nrmse_dict = defaultdict(list)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "6e3e7fde",
      "metadata": {
        "id": "6e3e7fde"
      },
      "outputs": [],
      "source": [
        "for initial_state in initial_states:\n",
        "    t_vals, chen_traj = generate_chen_data(\n",
        "    initial_state=initial_state,\n",
        "    tmax=tmax,\n",
        "    dt=dt\n",
        "    )\n",
        "\n",
        "    washout = 2000\n",
        "    t_vals = t_vals[washout:]\n",
        "    chen_traj = chen_traj[washout:]\n",
        "\n",
        "    scaler = MinMaxScaler()\n",
        "    scaler.fit(chen_traj)\n",
        "    chen_traj = scaler.transform(chen_traj)\n",
        "    T_data = len(chen_traj)\n",
        "\n",
        "    for train_frac in train_fracs:\n",
        "        train_end = int(train_frac * (T_data - 1))\n",
        "        train_input = chen_traj[:train_end]\n",
        "        train_target = chen_traj[1:train_end + 1]\n",
        "        test_input = chen_traj[train_end:-1]\n",
        "        test_target = chen_traj[train_end + 1:]\n",
        "        n_test_steps = len(test_input)\n",
        "        initial_in = test_input[0]\n",
        "\n",
        "        for seed in seeds:\n",
        "            # NVAR\n",
        "            nvar = NVARBaseline3D(k=100, ridge_alpha=1e-4)\n",
        "            nvar.fit(train_input, train_target)\n",
        "            print(nvar.total_parameters())\n",
        "            nvar_preds = nvar.predict(initial_in, n_test_steps)\n",
        "            nrmse = evaluate_nrmse(nvar_preds, test_target, all_horizons)\n",
        "            nrmse_dict['NVAR'].append(nrmse)\n",
        "\n",
        "            # LSTM\n",
        "            lstm_baseline = LSTMBaseline3D(hidden_size=500, lr=1e-3, epochs=80, device='cuda' if torch.cuda.is_available() else 'cpu', seed=seed)\n",
        "            print(lstm_baseline.total_parameters())\n",
        "            lstm_baseline.fit(train_input, train_target)\n",
        "            # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "            init_vec = train_target[-1]                # last teacher-forced target\n",
        "            lstm_preds = lstm_baseline.predict(initial_in, n_test_steps)\n",
        "            nrmse = evaluate_nrmse(lstm_preds, test_target, all_horizons)\n",
        "            nrmse_dict['LSTM'].append(nrmse)\n",
        "\n",
        "            tcn_baseline = TCNBaseline3D(hidden_dim=1500,lr=1e-3,epochs=180,device='cuda' if torch.cuda.is_available() else 'cpu',seed=seed)\n",
        "            print(tcn_baseline.total_parameters())\n",
        "            tcn_baseline.fit(train_input, train_target)\n",
        "            # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "            init_vec = train_target[-1]\n",
        "            tcn_preds = tcn_baseline.predict(initial_in, n_test_steps)\n",
        "            nrmse = evaluate_nrmse(tcn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['TCN'].append(nrmse)\n",
        "\n",
        "            transformer_baseline = SmallCausalTransformer3D(d_model= 200,nhead = 2,d_ff = 800,lr=1e-3,epochs=100,device='cuda' if torch.cuda.is_available() else 'cpu',seed=seed)\n",
        "            print(transformer_baseline.total_parameters())\n",
        "            transformer_baseline.fit(train_input, train_target)\n",
        "            # one-step roll-out to build an initial vector for auto-regressive mode\n",
        "            init_vec = train_target[-1]\n",
        "            transformer_preds = transformer_baseline.predict(initial_in, n_test_steps)\n",
        "            nrmse = evaluate_nrmse(transformer_preds, test_target, all_horizons)\n",
        "            nrmse_dict['Transformer'].append(nrmse)\n",
        "\n",
        "horizons = [300, 600, 1000]\n",
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'NVAR':<17} {'LSTM':<17} {'Transformer':<17} {'TCN':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "for horizon in horizons:\n",
        "    nvar_vals = [np.mean(nvar_nrmse[horizon]) for nvar_nrmse in nrmse_dict['NVAR']]\n",
        "    lstm_vals = [np.mean(lstm_nrmse[horizon]) for lstm_nrmse in nrmse_dict['LSTM']]\n",
        "    tfmr_vals = [np.mean(tfmr_nrmse[horizon]) for tfmr_nrmse in nrmse_dict['TFMR']]\n",
        "    tcn_vals = [np.mean(tcn_nrmse[horizon]) for tcn_nrmse in nrmse_dict['TCN']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [nvar_vals, lstm_vals, tfmr_vals, tcn_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean} ± {std}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "dfb18485",
      "metadata": {
        "id": "dfb18485"
      },
      "source": [
        "## Small World Reservoir"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "c31c25e8",
      "metadata": {
        "id": "c31c25e8"
      },
      "outputs": [],
      "source": [
        "class SWRes3D:\n",
        "    \"\"\"\n",
        "    Small-World Reservoir ESN for 3D -> 3D single-step prediction.\n",
        "    \"\"\"\n",
        "\n",
        "    def __init__(self,\n",
        "                 reservoir_size=300,\n",
        "                 rewiring_prob=0.1,\n",
        "                 degree=6,\n",
        "                 spectral_radius=0.95,\n",
        "                 input_scale=1.0,\n",
        "                 leaking_rate=1.0,\n",
        "                 ridge_alpha=1e-6,\n",
        "                 activation_choices=('tanh', 'relu', 'sin', 'linear'),\n",
        "                 seed=42):\n",
        "\n",
        "        self.reservoir_size = reservoir_size\n",
        "        self.rewiring_prob = rewiring_prob\n",
        "        self.degree = degree\n",
        "        self.spectral_radius = spectral_radius\n",
        "        self.input_scale = input_scale\n",
        "        self.leaking_rate = leaking_rate\n",
        "        self.ridge_alpha = ridge_alpha\n",
        "        self.activation_choices = activation_choices\n",
        "        self.seed = seed\n",
        "\n",
        "        np.random.seed(self.seed)\n",
        "        ws_graph = nx.watts_strogatz_graph(n=reservoir_size, k=degree, p=rewiring_prob, seed=seed)\n",
        "        A = nx.to_numpy_array(ws_graph)\n",
        "        W = A * np.random.uniform(-1, 1, size=A.shape)\n",
        "        self.W = scale_spectral_radius(W, spectral_radius)\n",
        "\n",
        "        np.random.seed(self.seed + 100)\n",
        "        self.W_in = (np.random.rand(reservoir_size, 3) - 0.5) * 2 * input_scale\n",
        "\n",
        "        np.random.seed(self.seed + 200)\n",
        "        self.node_activations = np.random.choice(activation_choices, size=reservoir_size)\n",
        "\n",
        "        self.reset_state()\n",
        "        self.W_out = None\n",
        "\n",
        "    def reset_state(self):\n",
        "        self.x = np.zeros(self.reservoir_size)\n",
        "\n",
        "    def _apply_activation(self, kind, val):\n",
        "        return np.tanh(val)\n",
        "\n",
        "    def _update(self, u):\n",
        "        pre = self.W @ self.x + self.W_in @ u\n",
        "        x_new = np.zeros_like(self.x)\n",
        "        for i in range(self.reservoir_size):\n",
        "            act = self.node_activations[i]\n",
        "            x_new[i] = self._apply_activation(act, pre[i])\n",
        "        self.x = (1 - self.leaking_rate) * self.x + self.leaking_rate * x_new\n",
        "\n",
        "    def collect_states(self, inputs, discard=100):\n",
        "        self.reset_state()\n",
        "        states = []\n",
        "        for u in inputs:\n",
        "            self._update(u)\n",
        "            states.append(self.x.copy())\n",
        "        return np.array(states)[discard:], np.array(states)[:discard]\n",
        "\n",
        "    def fit_readout(self, train_input, train_target, discard=100):\n",
        "        states, _ = self.collect_states(train_input, discard=discard)\n",
        "        targets = train_target[discard:]\n",
        "\n",
        "        X_aug = np.hstack([states, states**2, np.ones((len(states), 1))])\n",
        "        ridge = Ridge(alpha=self.ridge_alpha, fit_intercept=False)\n",
        "        ridge.fit(X_aug, targets)\n",
        "        self.W_out = ridge.coef_\n",
        "\n",
        "    def predict_open_loop(self, inputs):\n",
        "        preds = []\n",
        "        for u in inputs:\n",
        "            self._update(u)\n",
        "            x_aug = np.concatenate([self.x, self.x**2, [1.0]])\n",
        "            preds.append(self.W_out @ x_aug)\n",
        "        return np.array(preds)\n",
        "\n",
        "    def predict_autoregressive(self, initial_input, num_steps):\n",
        "        preds = []\n",
        "        current = initial_input.copy()\n",
        "        for _ in range(num_steps):\n",
        "            self._update(current)\n",
        "            x_aug = np.concatenate([self.x, self.x**2, [1.0]])\n",
        "            out = self.W_out @ x_aug\n",
        "            preds.append(out)\n",
        "            current = out\n",
        "        return np.array(preds)"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "5c035892",
      "metadata": {
        "id": "5c035892"
      },
      "source": [
        "### Lorenz"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "e87e168c",
      "metadata": {
        "id": "e87e168c"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [200, 400, 600, 800, 1000]\n",
        "initial_input = test_input[0]\n",
        "num_steps = len(test_input)\n",
        "lle_lorenz = 0.9\n",
        "lyapunov_time_lorenz = 1.0 / lle_lorenz\n",
        "lyapunov_time = lyapunov_time_lorenz\n",
        "VPT_threshold = 0.4\n",
        "test_time = np.arange(test_size)*dt\n",
        "seeds = range(1, 6)\n",
        "train_fracs = [0.7,0.75,0.8]\n",
        "initial_states = [[1.0, 1.0, 1.0], [1.0, 2.0, 3.0], [2.0, 1.5, 4.0]]\n",
        "tmax = 250\n",
        "dt = 0.02\n",
        "\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "VPT_dict = defaultdict(list)\n",
        "VPT_ratio_dict = defaultdict(list)\n",
        "adev_dict = defaultdict(list)\n",
        "\n",
        "for initial_state in initial_states:\n",
        "    t_vals, lorenz_traj = generate_lorenz_data(\n",
        "    initial_state=initial_state,\n",
        "    tmax=tmax,\n",
        "    dt=dt\n",
        "    )\n",
        "\n",
        "    washout = 2000\n",
        "    t_vals = t_vals[washout:]\n",
        "    lorenz_traj = lorenz_traj[washout:]\n",
        "\n",
        "    scaler = MinMaxScaler()\n",
        "    scaler.fit(lorenz_traj)\n",
        "    lorenz_traj = scaler.transform(lorenz_traj)\n",
        "    T_data = len(lorenz_traj)\n",
        "\n",
        "    for train_frac in train_fracs:\n",
        "        train_end = int(train_frac * (T_data - 1))\n",
        "        train_input = lorenz_traj[:train_end]\n",
        "        train_target = lorenz_traj[1:train_end + 1]\n",
        "        test_input = lorenz_traj[train_end:-1]\n",
        "        test_target = lorenz_traj[train_end + 1:]\n",
        "        n_test_steps = len(test_input)\n",
        "        initial_in = test_input[0]\n",
        "\n",
        "        for seed in seeds:\n",
        "            sw_esn = SWRes3D(\n",
        "                reservoir_size=300,\n",
        "                rewiring_prob=0.3,\n",
        "                degree=6,\n",
        "                spectral_radius=0.99,\n",
        "                input_scale=0.2,\n",
        "                leaking_rate=0.7,\n",
        "                ridge_alpha=1e-5,\n",
        "                seed=seed\n",
        "            )\n",
        "            sw_esn.fit_readout(train_input, train_target, discard=100)\n",
        "            sw_esn_preds = sw_esn.predict_autoregressive(initial_input, num_steps)\n",
        "            sw_esn_nrmse = evaluate_nrmse(sw_esn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['SW-ESN'].append(sw_esn_nrmse)\n",
        "            sw_esn_VPT, sw_esn_VPT_ratio = compute_valid_prediction_time(test_target, sw_esn_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['SW-ESN'].append(sw_esn_VPT)\n",
        "            VPT_ratio_dict['SW-ESN'].append(sw_esn_VPT_ratio)\n",
        "            sw_esn_adev = compute_attractor_deviation(sw_esn_preds, test_target)\n",
        "            adev_dict['SW-ESN'].append(sw_esn_adev)\n",
        "\n",
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'SW':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    sw_vals = [np.mean(sw_nrmse[horizon]) for sw_nrmse in nrmse_dict['SW']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [sw_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "15c897cc",
      "metadata": {
        "id": "15c897cc"
      },
      "source": [
        "### Rossler"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "33e46aeb",
      "metadata": {
        "id": "33e46aeb"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [200, 400, 600, 800, 1000]\n",
        "initial_input = test_input[0]\n",
        "num_steps = len(test_input)\n",
        "lle_rossler = 0.071\n",
        "lyapunov_time_rossler = 1.0 / lle_rossler\n",
        "lyapunov_time = lyapunov_time_rossler\n",
        "VPT_threshold = 0.4\n",
        "test_time = np.arange(test_size)*dt\n",
        "seeds = range(1, 6)\n",
        "train_fracs = [0.3, 0.35, 0.4]\n",
        "initial_states = [[1.0, 1.0, 1.0], [1.0, 2.0, 3.0], [2.0, 1.5, 4.0]]\n",
        "tmax = 250\n",
        "dt = 0.02\n",
        "\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "VPT_dict = defaultdict(list)\n",
        "VPT_ratio_dict = defaultdict(list)\n",
        "adev_dict = defaultdict(list)\n",
        "\n",
        "for initial_state in initial_states:\n",
        "    t_vals, rossler_traj = generate_rossler_data(\n",
        "    initial_state=initial_state,\n",
        "    tmax=tmax,\n",
        "    dt=dt\n",
        "    )\n",
        "\n",
        "    washout = 2000\n",
        "    t_vals = t_vals[washout:]\n",
        "    rossler_traj = rossler_traj[washout:]\n",
        "\n",
        "    scaler = MinMaxScaler()\n",
        "    scaler.fit(rossler_traj)\n",
        "    rossler_traj = scaler.transform(rossler_traj)\n",
        "    T_data = len(rossler_traj)\n",
        "\n",
        "    for train_frac in train_fracs:\n",
        "        train_end = int(train_frac * (T_data - 1))\n",
        "        train_input = rossler_traj[:train_end]\n",
        "        train_target = rossler_traj[1:train_end + 1]\n",
        "        test_input = rossler_traj[train_end:-1]\n",
        "        test_target = rossler_traj[train_end + 1:]\n",
        "        n_test_steps = len(test_input)\n",
        "        initial_in = test_input[0]\n",
        "\n",
        "        for seed in seeds:\n",
        "            sw_esn = SWRes3D(\n",
        "                reservoir_size=300,\n",
        "                rewiring_prob=0.3,\n",
        "                degree=6,\n",
        "                spectral_radius=0.99,\n",
        "                input_scale=0.2,\n",
        "                leaking_rate=0.7,\n",
        "                ridge_alpha=1e-5,\n",
        "                seed=seed\n",
        "            )\n",
        "            sw_esn.fit_readout(train_input, train_target, discard=100)\n",
        "            sw_esn_preds = sw_esn.predict_autoregressive(initial_input, num_steps)\n",
        "            sw_esn_nrmse = evaluate_nrmse(sw_esn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['SW-ESN'].append(sw_esn_nrmse)\n",
        "            sw_esn_VPT, sw_esn_VPT_ratio = compute_valid_prediction_time(test_target, sw_esn_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['SW-ESN'].append(sw_esn_VPT)\n",
        "            VPT_ratio_dict['SW-ESN'].append(sw_esn_VPT_ratio)\n",
        "            sw_esn_adev = compute_attractor_deviation(sw_esn_preds, test_target)\n",
        "            adev_dict['SW-ESN'].append(sw_esn_adev)\n",
        "\n",
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'SW':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    sw_vals = [np.mean(sw_nrmse[horizon]) for sw_nrmse in nrmse_dict['SW']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [sw_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "42e55c4e",
      "metadata": {
        "id": "42e55c4e"
      },
      "source": [
        "### Chen"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "5b8dcaeb",
      "metadata": {
        "id": "5b8dcaeb"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "horizons = [200, 400, 600, 800, 1000]\n",
        "initial_input = test_input[0]\n",
        "num_steps = len(test_input)\n",
        "lle_chen = 0.829\n",
        "lyapunov_time_chen = 1.0 / lle_chen\n",
        "lyapunov_time = lyapunov_time_chen\n",
        "VPT_threshold = 0.4\n",
        "test_time = np.arange(test_size)*dt\n",
        "seeds = range(1, 6)\n",
        "train_fracs = [0.7, 0.75, 0.8]\n",
        "initial_states = [[1.0, 1.0, 1.0], [1.0, 2.0, 3.0], [2.0, 1.5, 4.0]]\n",
        "tmax = 250\n",
        "dt = 0.02\n",
        "\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "VPT_dict = defaultdict(list)\n",
        "VPT_ratio_dict = defaultdict(list)\n",
        "adev_dict = defaultdict(list)\n",
        "\n",
        "for initial_state in initial_states:\n",
        "    t_vals, chen_traj = generate_chen_data(\n",
        "    initial_state=initial_state,\n",
        "    tmax=tmax,\n",
        "    dt=dt\n",
        "    )\n",
        "\n",
        "    washout = 2000\n",
        "    t_vals = t_vals[washout:]\n",
        "    chen_traj = chen_traj[washout:]\n",
        "\n",
        "    scaler = MinMaxScaler()\n",
        "    scaler.fit(chen_traj)\n",
        "    chen_traj = scaler.transform(chen_traj)\n",
        "    T_data = len(chen_traj)\n",
        "\n",
        "    for train_frac in train_fracs:\n",
        "        train_end = int(train_frac * (T_data - 1))\n",
        "        train_input = chen_traj[:train_end]\n",
        "        train_target = chen_traj[1:train_end + 1]\n",
        "        test_input = chen_traj[train_end:-1]\n",
        "        test_target = chen_traj[train_end + 1:]\n",
        "        n_test_steps = len(test_input)\n",
        "        initial_in = test_input[0]\n",
        "\n",
        "        for seed in seeds:\n",
        "            sw_esn = SWRes3D(\n",
        "                reservoir_size=300,\n",
        "                rewiring_prob=0.3,\n",
        "                degree=6,\n",
        "                spectral_radius=0.99,\n",
        "                input_scale=0.2,\n",
        "                leaking_rate=0.7,\n",
        "                ridge_alpha=1e-5,\n",
        "                seed=seed\n",
        "            )\n",
        "            sw_esn.fit_readout(train_input, train_target, discard=100)\n",
        "            sw_esn_preds = sw_esn.predict_autoregressive(initial_input, num_steps)\n",
        "            sw_esn_nrmse = evaluate_nrmse(sw_esn_preds, test_target, all_horizons)\n",
        "            nrmse_dict['SW-ESN'].append(sw_esn_nrmse)\n",
        "            sw_esn_VPT, sw_esn_VPT_ratio = compute_valid_prediction_time(test_target, sw_esn_preds, test_time, lyapunov_time, VPT_threshold)\n",
        "            VPT_dict['SW-ESN'].append(sw_esn_VPT)\n",
        "            VPT_ratio_dict['SW-ESN'].append(sw_esn_VPT_ratio)\n",
        "            sw_esn_adev = compute_attractor_deviation(sw_esn_preds, test_target)\n",
        "            adev_dict['SW-ESN'].append(sw_esn_adev)\n",
        "\n",
        "print(\"\\nNRMSE for Different Prediction Horizons:\")\n",
        "print(\"-\" * 140)\n",
        "print(f\"{'Horizon':<10} {'SW':<17}\")\n",
        "print(\"-\" * 140)\n",
        "\n",
        "\n",
        "for horizon in horizons:\n",
        "    sw_vals = [np.mean(sw_nrmse[horizon]) for sw_nrmse in nrmse_dict['SW']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [sw_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "8ad200a6",
      "metadata": {
        "id": "8ad200a6"
      },
      "source": [
        "### MITBIH"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "145b026d",
      "metadata": {
        "id": "145b026d"
      },
      "outputs": [],
      "source": [
        "import wfdb\n",
        "\n",
        "# Download and load record and annotations for patient #100\n",
        "record = wfdb.rdrecord('100', sampfrom=0, sampto=25002, pn_dir='mitdb')  # first 20,000 samples\n",
        "annotation = wfdb.rdann('100', 'atr', sampfrom=0, sampto=25002, pn_dir='mitdb')\n",
        "# Get input signal u(t) from the first channel\n",
        "u = record.p_signal[:, 0]\n",
        "u\n",
        "# Normalize input\n",
        "u_min = np.min(u)\n",
        "u_max = np.max(u)\n",
        "u_norm = (u - u_min) / (u_max - u_min)\n",
        "fs = record.fs  # sampling frequency (should be 360 Hz)\n",
        "t_vals = np.arange(len(u_norm)) / fs\n",
        "emb_dim = 3\n",
        "# inputs = u_norm\n",
        "inputs = create_delay_embedding(u_norm, emb_dim)\n",
        "\n",
        "# Create target array (heartbeat locations)\n",
        "targets = np.zeros(len(u_norm))\n",
        "targets[annotation.sample] = 1  # mark annotations as 1 (heartbeat)\n",
        "targets = create_delay_embedding(targets, emb_dim)\n",
        "data_size = len(inputs)\n",
        "train_size = 15000\n",
        "train_input = inputs[:train_size]\n",
        "train_target = targets[:train_size]\n",
        "test_input = inputs[train_size+1:]\n",
        "test_target = targets[train_size+1:]\n",
        "test_size = len(test_input)\n",
        "print(f\"Total samples: {data_size}, train size: {train_size}, test size: {test_size}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "288ea0f6",
      "metadata": {
        "id": "288ea0f6"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "seeds = range(995, 1025)\n",
        "\n",
        "for seed in seeds:\n",
        "    sw_esn = SWRes3D(\n",
        "        reservoir_size=300,\n",
        "        rewiring_prob=0.1,\n",
        "        degree=6,\n",
        "        spectral_radius=0.99,\n",
        "        input_scale=0.2,\n",
        "        leaking_rate=0.7,\n",
        "        ridge_alpha=1e-5,\n",
        "        seed=seed\n",
        "    )\n",
        "    sw_esn.fit_readout(train_input, train_target, discard=5000)\n",
        "    sw_esn_preds = sw_esn.predict_autoregressive(initial_input, num_steps)\n",
        "    sw_esn_nrmse = evaluate_nrmse(sw_esn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['SW-ESN'].append(sw_esn_nrmse)\n",
        "\n",
        "for horizon in horizons:\n",
        "    sw_vals = [np.mean(sw_nrmse[horizon]) for sw_nrmse in nrmse_dict['SW-ESN']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [sw_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "7704363f",
      "metadata": {
        "id": "7704363f"
      },
      "source": [
        "### Sunspot"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "47caf31b",
      "metadata": {
        "id": "47caf31b"
      },
      "outputs": [],
      "source": [
        "import pandas as pd\n",
        "file_path = 'dataset/SN_m_tot_V2.0.csv'\n",
        "\n",
        "df = pd.read_csv(file_path, sep=';', header = None)\n",
        "df\n",
        "data = df.iloc[:, 3].values\n",
        "dt = 1\n",
        "dataset_size = len(data)\n",
        "data = create_delay_embedding(data, 3)\n",
        "print(f\"Dataset size: {dataset_size}\")\n",
        "\n",
        "# Train/Test Split\n",
        "train_end = 2000\n",
        "train_input  = data[:train_end]\n",
        "train_target = data[1:train_end+1]\n",
        "test_input   = data[train_end:-1]\n",
        "test_target  = data[train_end+1:]\n",
        "y_test = test_target\n",
        "n_test_steps = len(test_target)\n",
        "time_test = np.arange(n_test_steps) * dt\n",
        "\n",
        "print(f\"Train size: {len(train_input)}\\nTest size: {len(test_input)}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "b2d25498",
      "metadata": {
        "id": "b2d25498"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "seeds = range(995, 1025)\n",
        "\n",
        "for seed in seeds:\n",
        "    sw_esn = SWRes3D(\n",
        "        reservoir_size=300,\n",
        "        rewiring_prob=0.1,\n",
        "        degree=6,\n",
        "        spectral_radius=0.99,\n",
        "        input_scale=0.2,\n",
        "        leaking_rate=0.7,\n",
        "        ridge_alpha=1e-5,\n",
        "        seed=seed\n",
        "    )\n",
        "    sw_esn.fit_readout(train_input, train_target, discard=100)\n",
        "    sw_esn_preds = sw_esn.predict_autoregressive(initial_input, num_steps)\n",
        "    sw_esn_nrmse = evaluate_nrmse(sw_esn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['SW-ESN'].append(sw_esn_nrmse)\n",
        "\n",
        "for horizon in horizons:\n",
        "    sw_vals = [np.mean(sw_nrmse[horizon]) for sw_nrmse in nrmse_dict['SW-ESN']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [sw_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "0cc6d7bf",
      "metadata": {
        "id": "0cc6d7bf"
      },
      "source": [
        "### Santa Fe"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "5c039c73",
      "metadata": {
        "id": "5c039c73"
      },
      "outputs": [],
      "source": [
        "import pandas as pd\n",
        "\n",
        "file_path = 'dataset/santa-fe-time-series/b1.txt'\n",
        "\n",
        "df = pd.read_csv(file_path, header=None, sep=' ')\n",
        "df\n",
        "# Normalize the first column (column 0) of the DataFrame\n",
        "df[0] = (df[0] - df[0].min()) / (df[0].max() - df[0].min()) \n",
        "data = df.iloc[:, 0].values\n",
        "chosen_system = \"SantaFe\"\n",
        "dt = 1\n",
        "T_data = len(data)\n",
        "data = create_delay_embedding(data, 3)\n",
        "print(f\"Data length: {T_data}.\")\n",
        "\n",
        "# Train/Test Split\n",
        "train_end = 7000\n",
        "train_input  = data[:train_end]\n",
        "train_target = data[1:train_end+1]\n",
        "test_input   = data[train_end:-1]\n",
        "test_target  = data[train_end+1:]\n",
        "y_test = test_target\n",
        "n_test_steps = len(test_target)\n",
        "time_test = np.arange(n_test_steps) * dt\n",
        "\n",
        "print(f\"Train size: {len(train_input)}  \\nTest size: {len(test_input)}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "3782545d",
      "metadata": {
        "id": "3782545d"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "seeds = range(995, 1025)\n",
        "\n",
        "for seed in seeds:\n",
        "    sw_esn = SWRes3D(\n",
        "        reservoir_size=300,\n",
        "        rewiring_prob=0.1,\n",
        "        degree=6,\n",
        "        spectral_radius=0.99,\n",
        "        input_scale=0.2,\n",
        "        leaking_rate=0.7,\n",
        "        ridge_alpha=1e-5,\n",
        "        seed=seed\n",
        "    )\n",
        "    sw_esn.fit_readout(train_input, train_target, discard=100)\n",
        "    sw_esn_preds = sw_esn.predict_autoregressive(initial_input, num_steps)\n",
        "    sw_esn_nrmse = evaluate_nrmse(sw_esn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['SW-ESN'].append(sw_esn_nrmse)\n",
        "\n",
        "for horizon in horizons:\n",
        "    sw_vals = [np.mean(sw_nrmse[horizon]) for sw_nrmse in nrmse_dict['SW-ESN']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [sw_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    },
    {
      "cell_type": "markdown",
      "id": "9d66f28e",
      "metadata": {
        "id": "9d66f28e"
      },
      "source": [
        "### BIDMC"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "235532bf",
      "metadata": {
        "id": "235532bf"
      },
      "outputs": [],
      "source": [
        "# ─── Load BIDMC Record ─────────────────────────────────────────────────────\n",
        "record_id = 'bidmc01'\n",
        "record = wfdb.rdrecord(record_id, pn_dir='bidmc', sampto=8 * 60 * 125)  # 8 mins at 125Hz\n",
        "signals = record.p_signal  # shape: (60000, 5)\n",
        "names = [n.strip().strip(',') for n in record.sig_name]\n",
        "# ─── Get Indices of ECG Lead II and RESP ──────────────────────────────────\n",
        "idx_ecg = names.index('II')     # ECG Lead II\n",
        "idx_resp = names.index('RESP')  # Respiration signal\n",
        "# ─── Parameters ────────────────────────────────────────────────────────────\n",
        "N_train = 10000\n",
        "N_test = 5000\n",
        "emb_dim = 3\n",
        "# ─── Select Signals ────────────────────────────────────────────────────────\n",
        "u = signals[:, idx_ecg]   # input: ECG Lead II\n",
        "v = signals[:, idx_resp]  # target: RESP\n",
        "# ─── Normalize to [-1, 1] ──────────────────────────────────────────────────\n",
        "u_norm = 2 * (u - np.min(u)) / (np.max(u) - np.min(u)) - 1\n",
        "v_norm = 2 * (v - np.min(v)) / (np.max(v) - np.min(v)) - 1\n",
        "# ─── Delay Embedding ───────────────────────────────────────────────────────\n",
        "inputs = create_delay_embedding(u_norm, emb_dim)\n",
        "targets = create_delay_embedding(v_norm, emb_dim)\n",
        "# ─── Train/Test Split ──────────────────────────────────────────────────────\n",
        "train_input = inputs[:N_train]\n",
        "train_target = targets[:N_train]\n",
        "test_input = inputs[N_train:N_train+N_test]\n",
        "test_target = targets[N_train:N_train+N_test]\n",
        "# ─── Summary ───────────────────────────────────────────────────────────────\n",
        "print(f\"Train input shape:  {train_input.shape}\")\n",
        "print(f\"Train target shape: {train_target.shape}\")\n",
        "print(f\"Test input shape:   {test_input.shape}\")\n",
        "print(f\"Test target shape:  {test_target.shape}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "id": "e9ea51bf",
      "metadata": {
        "id": "e9ea51bf"
      },
      "outputs": [],
      "source": [
        "all_horizons = list(range(10, 1001, 10))\n",
        "\n",
        "nrmse_dict = defaultdict(list)\n",
        "seeds = range(995, 1025)\n",
        "\n",
        "for seed in seeds:\n",
        "    sw_esn = SWRes3D(\n",
        "        reservoir_size=300,\n",
        "        rewiring_prob=0.1,\n",
        "        degree=6,\n",
        "        spectral_radius=0.99,\n",
        "        input_scale=0.2,\n",
        "        leaking_rate=0.7,\n",
        "        ridge_alpha=1e-5,\n",
        "        seed=seed\n",
        "    )\n",
        "    sw_esn.fit_readout(train_input, train_target, discard=5000)\n",
        "    sw_esn_preds = sw_esn.predict_autoregressive(initial_input, num_steps)\n",
        "    sw_esn_nrmse = evaluate_nrmse(sw_esn_preds, test_target, all_horizons)\n",
        "    nrmse_dict['SW-ESN'].append(sw_esn_nrmse)\n",
        "\n",
        "for horizon in horizons:\n",
        "    sw_vals = [np.mean(sw_nrmse[horizon]) for sw_nrmse in nrmse_dict['SW-ESN']]\n",
        "\n",
        "    print(f\"{horizon:<10}\", end=\" \")\n",
        "    for vals in [sw_vals]:\n",
        "        mean = np.mean(vals)\n",
        "        std = np.std(vals)\n",
        "        print(f\"{mean:.4f} ± {std:.4f}\".ljust(18), end=\"\")\n",
        "    print()"
      ]
    }
  ],
  "metadata": {
    "colab": {
      "provenance": []
    },
    "kernelspec": {
      "display_name": "Python 3",
      "language": "python",
      "name": "python3"
    },
    "language_info": {
      "codemirror_mode": {
        "name": "ipython",
        "version": 3
      },
      "file_extension": ".py",
      "mimetype": "text/x-python",
      "name": "python",
      "nbconvert_exporter": "python",
      "pygments_lexer": "ipython3",
      "version": "3.13.3"
    }
  },
  "nbformat": 4,
  "nbformat_minor": 5
}
