{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "d034bdc6",
   "metadata": {},
   "outputs": [],
   "source": [
    "#Load required packages\n",
    "import pandas\n",
    "import random\n",
    "import numpy as np\n",
    "from numpy import loadtxt\n",
    "from numpy import savetxt\n",
    "import tensorflow as tf\n",
    "from keras.models import Sequential\n",
    "from keras.layers import Dense\n",
    "from keras.wrappers.scikit_learn import KerasRegressor\n",
    "from sklearn.model_selection import cross_validate\n",
    "from sklearn.model_selection import KFold\n",
    "from sklearn.preprocessing import StandardScaler\n",
    "from sklearn.pipeline import Pipeline\n",
    "import matplotlib.pyplot as plt\n",
    "from matplotlib.patches import Patch\n",
    "from matplotlib.lines import Line2D"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "c0d6992a",
   "metadata": {},
   "outputs": [],
   "source": [
    "#Create data\n",
    "# Pick 10000 points beta on SO(3) uniformly at random\n",
    "R = np.random.rand(10000,1)*np.pi\n",
    "# First column of X corresponds to the trivial character\n",
    "X = np.ones((10000,1))\n",
    "# Each column X now consists of the first 22 lowest order irrdeucible character\n",
    "for k in range(21):\n",
    "    X = np.append(X,np.sin((k+1.5)*R)/np.sin(0.5*R), axis=1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "54891fae",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Input alphabet for neural network is half the size of that for linear regression. \n",
    "# Pick first 11 columns \n",
    "Xnn = X[:,range(11)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "599b1547",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Generating basis of 10 indicator functions\n",
    "B = np.zeros((10000,10))\n",
    "for k in range(10):\n",
    "    L = np.all( [0.1*np.pi*k<R, R<0.1*np.pi*k + 0.12*np.pi], axis=0)\n",
    "    B[:,k] = np.where(L.reshape(10000,), 1, 0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "325eeaea",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Create 10x100 Gaussian to post multiply by B, outputting a 10000x100 matrix\n",
    "# Each column corresponding to a class function to be learned\n",
    "G = np.random.normal(loc=0.0, scale=1.0, size=(10,100))\n",
    "Y = np.dot(B,G)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "beee7d64",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Our neural network model of depth 6\n",
    "def NN6_model():\n",
    "\t# create model\n",
    "\tmodel = Sequential()\n",
    "\tmodel.add(Dense(180, input_dim=11, kernel_initializer='normal', kernel_regularizer=tf.keras.regularizers.l2(3e-7), activation='relu'))\n",
    "\tmodel.add(Dense(150, kernel_initializer='normal', kernel_regularizer=tf.keras.regularizers.l2(3e-7), activation='relu'))\n",
    "\tmodel.add(Dense(100, kernel_initializer='normal', kernel_regularizer=tf.keras.regularizers.l2(3e-7), activation='relu'))\n",
    "\tmodel.add(Dense(60, kernel_initializer='normal', kernel_regularizer=tf.keras.regularizers.l2(3e-7), activation='relu'))\n",
    "\tmodel.add(Dense(35, kernel_initializer='normal', kernel_regularizer=tf.keras.regularizers.l2(3e-7), activation='relu'))\n",
    "\tmodel.add(Dense(10, kernel_initializer='normal', kernel_regularizer=tf.keras.regularizers.l2(3e-7), activation='relu'))\n",
    "\tmodel.add(Dense(1, kernel_initializer='normal'))     \n",
    "\t# Compile model\n",
    "\tmodel.compile(loss='mean_squared_error', optimizer= 'Adamax')\n",
    "\treturn model\n",
    "NN6_model().summary()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "df15e94c",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Evaluate NN6 using 10 folds\n",
    "estimator = []\n",
    "estimator.append(('standardize', StandardScaler()))\n",
    "estimator.append(('mlp', KerasRegressor(build_fn=NN6_model, epochs=250, batch_size=500, verbose=1)))\n",
    "pipeline = Pipeline(estimator)\n",
    "kfold = KFold(n_splits=10)\n",
    "scoring = {'MSE': 'neg_mean_squared_error'}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ed0316b9",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Creates an empty array to be appended with 10 dimensional column vectors\n",
    "NN6losses = [[] for _ in range(10)]\n",
    "\n",
    "# For loop that adds a class function to be trained for each iteration\n",
    "for k in range(100):\n",
    "    scoreNN6 = cross_validate(pipeline, Xnn, Y[:,k], cv=kfold, scoring = scoring, \n",
    "                     return_train_score=True,  return_estimator=True)\n",
    "    TempLossNN6 = scoreNN6['test_MSE']\n",
    "    # Collect the losses for each class function in a new column\n",
    "    NN6losses = np.append(NN6losses, TempLossNN6.reshape((10,1)), axis=1)\n",
    "    #save results\n",
    "    savetxt('NN6losses.csv' , NN6losses, delimiter=\",\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "afc08839",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Our neural network model\n",
    "def NN3_model():\n",
    "\t# create model\n",
    "\tmodel = Sequential()\n",
    "\tmodel.add(Dense(150, input_dim=11, kernel_initializer='normal', kernel_regularizer=tf.keras.regularizers.l2(0.0000003), activation='relu'))\n",
    "\tmodel.add(Dense(100, kernel_initializer='normal', kernel_regularizer=tf.keras.regularizers.l2(0.0000003), activation='relu'))\n",
    "\tmodel.add(Dense(50, kernel_initializer='normal', kernel_regularizer=tf.keras.regularizers.l2(0.0000003), activation='relu'))\n",
    "\tmodel.add(Dense(1, kernel_initializer='normal'))     \n",
    "\t# Compile model\n",
    "\tmodel.compile(loss='mean_squared_error', optimizer= 'Adamax')\n",
    "\treturn model\n",
    "#NN3_model().summary()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "3ebed0a1",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Evaluate NN3 using 10 folds\n",
    "estimator = []\n",
    "estimator.append(('standardize', StandardScaler()))\n",
    "estimator.append(('mlp', KerasRegressor(build_fn=NN3_model, epochs=350, batch_size=500, verbose=1)))\n",
    "pipeline = Pipeline(estimator)\n",
    "kfold = KFold(n_splits=10)\n",
    "scoring = {'MSE': 'neg_mean_squared_error'}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "dea00e7f",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Creates an empty array to be appended with 10 dimensional column vectors\n",
    "NN3losses = [[] for _ in range(10)]\n",
    "\n",
    "# For loop that adds a class function to be trained for each iteration\n",
    "for k in range(100):\n",
    "    scoreNN3 = cross_validate(pipeline, Xnn, Y[:,k], cv=kfold, scoring = scoring, \n",
    "                     return_train_score=True,  return_estimator=True)\n",
    "    TempLossNN3 = scoreNN3['test_MSE']\n",
    "    # Collect the losses for each class function in a new column\n",
    "    NN3losses = np.append(NN6losses, TempLossNN3.reshape((10,1)), axis=1)\n",
    "    #save results\n",
    "    savetxt('NN3losses.csv' , NN3losses, delimiter=\",\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "id": "a9dfecc2",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Linear model\n",
    "def Linear_model():\n",
    "\t# create model\n",
    "\tmodel = Sequential()\n",
    "\tmodel.add(Dense(1, input_dim=22, kernel_initializer='normal'))\n",
    "\t# Compile model\n",
    "\tmodel.compile(loss='mean_squared_error', optimizer= 'Adamax')\n",
    "\treturn model\n",
    "Linear_model().summary()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "id": "37c75114",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Evaluate linear model using 10 folds\n",
    "estimator = []\n",
    "estimator.append(('standardize', StandardScaler()))\n",
    "estimator.append(('mlp', KerasRegressor(build_fn=Linear_model, epochs=80, batch_size=100, verbose=1)))\n",
    "pipeline = Pipeline(estimator)\n",
    "kfold = KFold(n_splits=10)\n",
    "scoring = {'MSE': 'neg_mean_squared_error'}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7ebf6e9c",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Creates an empty array to be appended with 10 dimensional column vectors\n",
    "Linearlosses = [[] for _ in range(10)]\n",
    "\n",
    "# For loop that adds a class function to be trained for each iteration\n",
    "for k in range(100):\n",
    "    scoreLinear = cross_validate(pipeline, X, Y[:,k], cv=kfold, scoring = scoring, \n",
    "                     return_train_score=True,  return_estimator=True)\n",
    "    TempLossLinear = scoreLinear['test_MSE']\n",
    "    Linearlosses = np.append(Linearlosses, TempLossLinear.reshape((10,1)), axis=1)\n",
    "    #save results\n",
    "    savetxt('Linearlosses.csv' , Linearlosses, delimiter=\",\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ee788b1a",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Create Scatter Plots\n",
    "plt.scatter(np.std(NN6losses, axis =0), -np.mean(NN6losses, axis = 0), c=\"blue\")\n",
    "plt.scatter(np.std(NN3losses, axis =0), -np.mean(NN3losses, axis = 0), c=\"red\")\n",
    "plt.scatter(np.std(Linearlosses, axis =0), -np.mean(Linearlosses, axis = 0), c=\"green\")\n",
    "plt.title(\"Discontinuous class function learning performance\")\n",
    "plt.xlabel(\"Standard Deviation over 10 folds\")\n",
    "plt.ylabel(\"Mean over 10 folds of MSE\")\n",
    "legend_elements = [Line2D([0], [0], marker='o', color='w', label='NN6',\n",
    "                          markerfacecolor='b', markersize=8),\n",
    "                   Line2D([0], [0], marker='o', color='w', label='NN3',\n",
    "                          markerfacecolor='r', markersize=8),\n",
    "                Line2D([0], [0], marker='o', color='w', label='Linear Regression',\n",
    "                          markerfacecolor='g', markersize=8),]                 \n",
    "plt.legend(handles=legend_elements)\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e4a945ce",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Create Histogram\n",
    "plt.hist(-np.mean(NN6losses,axis =0), histtype='stepfilled', alpha=0.3, bins=10)\n",
    "plt.hist(-np.mean(NN3losses,axis =0), histtype='stepfilled', alpha=0.3, bins=10)\n",
    "plt.hist(-np.mean(Linearlosses,axis =0), histtype='stepfilled', alpha=0.3, bins=10);\n",
    "plt.title(\"Discontinuous class function learning performance\")\n",
    "plt.xlabel(\"Mean MSE over 10 folds\")\n",
    "plt.ylabel(\"Frequency\")\n",
    "legend_elements = [Patch(facecolor='blue', edgecolor='b',\n",
    "                        label='NN6 mean  '+ str(round(-np.mean(NN6losses,axis =0).mean(),6))),\n",
    "                   Patch(facecolor='red', edgecolor='r',\n",
    "                        label='NN3 mean  '+ str(round(-np.mean(NN3losses,axis =0).mean(),6))),\n",
    "                   Patch(facecolor='green', edgecolor='g',\n",
    "                        label='Linear Regression mean  '+ str(round(-np.mean(Linearlosses,axis =0).mean(),6))),]\n",
    "plt.legend(handles=legend_elements)\n",
    "plt.show()"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
