{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "539ebd7b",
   "metadata": {},
   "outputs": [],
   "source": [
    "###This code is about develop a RNN model for the target CSTR process using heterogeneous transfer learning\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "from sklearn import preprocessing\n",
    "from sklearn.model_selection import train_test_split\n",
    "from sklearn.metrics import mean_absolute_percentage_error\n",
    "from keras.models import Sequential\n",
    "from keras.layers import LSTM, Dense, SimpleRNN, Input, Activation, Dropout\n",
    "from keras import backend as K\n",
    "from tensorflow.keras.optimizers import Adam,SGD\n",
    "import tensorflow as tf\n",
    "from keras.models import Model\n",
    "from keras.models import load_model\n",
    "import time "
   ]
  },
  {
   "cell_type": "markdown",
   "id": "069e2e34",
   "metadata": {},
   "source": [
    "# Generate Target dataset"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "3a4a2d8e",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "number of initial conditions: 242\n",
      "(1, 242)\n",
      "shape of x_deviation is (242, 2)\n",
      "(242, 2)\n"
     ]
    }
   ],
   "source": [
    "# specifying constant parameters\n",
    "#input varioable: Q, C_A0\n",
    "#state variable: T, C_A\n",
    "\n",
    "T_0 = 300\n",
    "V = 1\n",
    "k_0 = 8.46*(np.power(10,6))\n",
    "C_p = 0.231\n",
    "rho_L = 1000\n",
    "F = 5\n",
    "E = 5*(np.power(10,4))\n",
    "delta_H = -1.15*(np.power(10,4))\n",
    "R = 8.314\n",
    "\n",
    "C_A0s = 4   # the steady state for input variable C_A0\n",
    "Q_s = 0.0  # the steady state for input variable Q\n",
    "\n",
    "C_As = 1.95 # the steady state for state variable C_A\n",
    "T_s = 402  # the steady state for state variable T\n",
    "\n",
    "t_final = 0.01  #the control period\n",
    "t_step = 1e-4   # the step to use first-principle to calculate the state\n",
    "P = np.array([[1060, 22], [22, 0.52]])\n",
    "\n",
    "# generating inputs and initial states for CSTR, all expressed in deviation form\n",
    "\n",
    "u1_list = np.linspace(-3.5, 3.5, 10, endpoint=True)\n",
    "u2_list = np.linspace(-5e5, 5e5, 10, endpoint=True)\n",
    "T_initial = np.linspace(300, 550, 40, endpoint=True) - T_s\n",
    "CA_initial = np.linspace(1, 4., 40, endpoint=True) - C_As    # CA and T must be >0\n",
    "\n",
    "\n",
    "# sieve out initial states that lie outside of stability region\n",
    "\n",
    "T_start = list()\n",
    "CA_start = list()\n",
    "\n",
    "for T in T_initial:   \n",
    "    for CA in CA_initial:\n",
    "        x = np.array([CA, T])\n",
    "        if x @ P @ x < 368:   #calculate the stability region for state \n",
    "            CA_start.append(CA)\n",
    "            T_start.append(T)\n",
    "print(\"number of initial conditions: {}\".format(len(CA_start)))\n",
    "\n",
    "# convert to np.arrays\n",
    "CA_start = np.array([CA_start])\n",
    "T_start = np.array([T_start])\n",
    "print(CA_start.shape)\n",
    "x_deviation = np.concatenate((CA_start.T, T_start.T), axis=1)  # every row is a pair of initial states within stability region\n",
    "print(\"shape of x_deviation is {}\".format(x_deviation.shape))\n",
    "print(x_deviation.shape) "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "16075e8a",
   "metadata": {},
   "outputs": [],
   "source": [
    "def CSTR_simulation(F, V, C_A0, k_0, E, R, T_0, delta_H, rho_L, C_p, Q, t_final, t_step, C_A_initial, T_initial):\n",
    "    \"\"\"\n",
    "        simulating CSTR using forward Euler method\n",
    "    \"\"\"\n",
    "    \n",
    "    C_A_list = list()  # evolution of CA over time\n",
    "    T_list = list()  # evolution of T over time\n",
    "    \n",
    "    C_A = C_A_initial + C_As  # the real state.the derivation plus the steady state\n",
    "    T = T_initial + T_s\n",
    "    \n",
    "    for i in range(int(t_final / t_step)):\n",
    "        dCAdt = F / V * (C_A0 - C_A) - k_0 * np.exp(-E / (R * T)) * C_A**2\n",
    "        dTdt = F / V * (T_0 - T) - delta_H / (rho_L * C_p) * k_0 * np.exp(-E / (R * T)) * C_A**2 + Q / (rho_L * C_p * V)\n",
    "        \n",
    "        C_A += dCAdt * t_step\n",
    "        T += dTdt * t_step\n",
    "        \n",
    "        if i%10 ==0:\n",
    "            C_A_list.append(C_A - C_As)  # in deviation form\n",
    "            T_list.append(T - T_s)  # in deviation form \n",
    "    \n",
    "    return C_A_list, T_list"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "b400bf04",
   "metadata": {},
   "outputs": [],
   "source": [
    "# get X and y data for training and testing\n",
    "\n",
    "CA_output = list()\n",
    "T_output = list()\n",
    "\n",
    "CA_input = list()\n",
    "T_input = list()\n",
    "CA0_input = list()\n",
    "Q_input = list()  \n",
    "\n",
    "for u1 in u1_list:\n",
    "    C_A0 = u1 + C_A0s\n",
    "    \n",
    "    for u2 in u2_list:\n",
    "        Q = u2 + Q_s\n",
    "        \n",
    "        for C_A_initial, T_initial in x_deviation:\n",
    "            CA0_input.append(u1)\n",
    "            Q_input.append(u2)\n",
    "            CA_input.append(C_A_initial)\n",
    "            T_input.append(T_initial)\n",
    "            \n",
    "            C_A_list, T_list = CSTR_simulation(F, V, C_A0, k_0, E, R, T_0, delta_H, rho_L, C_p, Q, t_final, t_step, C_A_initial, T_initial)\n",
    "            CA_output.append(C_A_list)\n",
    "            T_output.append(T_list)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "d18fd7d5",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "RNN_input shape is (24200, 1, 4)\n",
      "RNN_input shape is (24200, 10, 4)\n",
      "RNN_output shape is (24200, 10, 2)\n"
     ]
    }
   ],
   "source": [
    "# collate input for RNN\n",
    "\n",
    "CA0_input = np.array(CA0_input)\n",
    "CA0_input = CA0_input.reshape(-1,1,1)\n",
    "\n",
    "Q_input = np.array(Q_input)\n",
    "Q_input = Q_input.reshape(-1,1,1)\n",
    "\n",
    "CA_input = np.array(CA_input)\n",
    "CA_input = CA_input.reshape(-1,1,1)\n",
    "\n",
    "T_input = np.array(T_input)\n",
    "T_input = T_input.reshape(-1,1,1)\n",
    "\n",
    "RNN_input = np.concatenate((T_input, CA_input, Q_input, CA0_input), axis=2)   #the value for input variable and the initial value for state variable \n",
    "\n",
    "\"\"\"\n",
    "    the input to RNN is in the shape [number of samples x timestep x variables], and the input variables are same for every\n",
    "    time step, not sure if my treatment here is correct\n",
    "\"\"\"\n",
    "print(\"RNN_input shape is {}\".format(RNN_input.shape))\n",
    "RNN_input = RNN_input.repeat(10, axis=1)  \n",
    "print(\"RNN_input shape is {}\".format(RNN_input.shape))\n",
    "\n",
    "# collate output for RNN\n",
    "\n",
    "CA_output = np.array(CA_output)\n",
    "CA_output = CA_output.reshape(-1, 10, 1)\n",
    "\n",
    "T_output = np.array(T_output)\n",
    "T_output = T_output.reshape(-1, 10, 1)\n",
    "\n",
    "RNN_output = np.concatenate((CA_output,T_output), axis=2)\n",
    "print(\"RNN_output shape is {}\".format(RNN_output.shape))  # output shape: number of samples x timestep x variables"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "aa5fda0a",
   "metadata": {},
   "source": [
    "# normalization using scalers for each process, due to different features"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "c4172f79",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(24, 10, 4) (24176, 10, 4) (24, 10, 2) (24176, 10, 2)\n"
     ]
    }
   ],
   "source": [
    "#target data\n",
    "X_train, X_test, y_train, y_test = train_test_split(RNN_input, RNN_output, test_size=0.999, random_state=123)\n",
    "\n",
    "# define scalers for both X and y base on training data only\n",
    "scaler_X = preprocessing.StandardScaler().fit(X_train.reshape(-1, 4))\n",
    "scaler_y = preprocessing.StandardScaler().fit(y_train.reshape(-1, 2))\n",
    "\n",
    "X_train = scaler_X.transform(X_train.reshape(-1, 4)).reshape(-1,10,4)\n",
    "X_test = scaler_X.transform(X_test.reshape(-1, 4)).reshape(-1,10,4)\n",
    "y_train = scaler_y.transform(y_train.reshape(-1,2)).reshape(-1,10,2)\n",
    "y_test = scaler_y.transform(y_test.reshape(-1,2)).reshape(-1,10,2)\n",
    "\n",
    "print(X_train.shape, X_test.shape, y_train.shape, y_test.shape)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "b1f81109",
   "metadata": {},
   "source": [
    "# Develop the pre-trained model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "25925acb",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "2025-06-13 16:55:08.137360: E tensorflow/stream_executor/cuda/cuda_driver.cc:271] failed call to cuInit: CUDA_ERROR_NO_DEVICE: no CUDA-capable device is detected\n",
      "2025-06-13 16:55:08.137418: I tensorflow/stream_executor/cuda/cuda_diagnostics.cc:156] kernel driver does not appear to be running on this host (wulab2-System-Product-Name): /proc/driver/nvidia/version does not exist\n",
      "2025-06-13 16:55:08.138485: I tensorflow/core/platform/cpu_feature_guard.cc:151] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations:  AVX2 AVX512F FMA\n",
      "To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "36/36 - 1s - loss: 0.5447 - mse: 0.5447 - val_loss: 0.2914 - val_mse: 0.2914 - 537ms/epoch - 15ms/step\n",
      "Epoch 2/2\n",
      "36/36 - 0s - loss: 0.2402 - mse: 0.2402 - val_loss: 0.2026 - val_mse: 0.2026 - 62ms/epoch - 2ms/step\n",
      "0.6627440452575684\n"
     ]
    }
   ],
   "source": [
    "###the standard RNN model is trained as benchmark, to show the priority of transfer learning RNN models\n",
    "model = Sequential()\n",
    "model.add(SimpleRNN(16, activation='tanh', return_sequences=True))\n",
    "model.add(Dense(2, activation='linear'))\n",
    "model.compile(optimizer='adam', loss='mse', metrics=['mse'])\n",
    "\n",
    "t0 = time.time()\n",
    "history = model.fit(X_train_S, y_train_S, epochs=2, batch_size=256, validation_split=0.25, verbose=2)\n",
    "t1 = time.time()\n",
    "print(t1-t0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "81f35c9a",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "48/48 [==============================] - 0s 758us/step - loss: 0.2008 - mse: 0.2008\n",
      "[0.20078706741333008, 0.20078709721565247]\n",
      "0.6627440452575684\n"
     ]
    }
   ],
   "source": [
    "#use the SOURCE test data to evaluate the model\n",
    "loss_and_metrics = model.evaluate(X_test_S, y_test_S, batch_size=256)\n",
    "print(loss_and_metrics)\n",
    "\n",
    "print(t1-t0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "ef7b115a",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "95/95 [==============================] - 0s 705us/step - loss: 3.6427 - mse: 3.6427\n",
      "[3.6427011489868164, 3.642699956893921]\n",
      "0.6627440452575684\n"
     ]
    }
   ],
   "source": [
    "#use the TARGET test data to evaluate the model\n",
    "loss_and_metrics = model.evaluate(X_test, y_test, batch_size=256)\n",
    "print(loss_and_metrics)\n",
    "\n",
    "print(t1-t0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "364b1d8c",
   "metadata": {},
   "outputs": [],
   "source": [
    "model.save(\"pretrained_model.h5\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f9ed7589",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.10"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
