{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Working example of GLAD \n",
    "Fitting GLAD on a single random sparse graph with samples obtained from a corresponding multivariate Gaussian distribution"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "/root/anaconda3/envs/glad\n"
     ]
    }
   ],
   "source": [
    "import os, sys\n",
    "# reloads modules automatically before entering the \n",
    "# execution of code typed at the IPython prompt.\n",
    "%load_ext autoreload\n",
    "%autoreload 2\n",
    "# install jupyter-notebook in the env if the prefix does not \n",
    "# show the desired virtual env. \n",
    "print(sys.prefix)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Pytorch version  1.4.0\n",
      "networkx version  2.5\n"
     ]
    }
   ],
   "source": [
    "# importing required modules: Python 3 used. \n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import torch\n",
    "print('Pytorch version ', torch.__version__)\n",
    "import sys\n",
    "import scipy\n",
    "import networkx as nx\n",
    "print('networkx version ', nx.__version__)\n",
    "import copy, random\n",
    "import matplotlib.pyplot as plt\n",
    "from glad import glad\n",
    "from glad_model import glad_model\n",
    "import torch.nn as nn\n",
    "from metrics import report_metrics\n",
    "import warnings\n",
    "warnings.filterwarnings('ignore')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Initialize the parameters"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "# initializing basic params\n",
    "D = 10 # Dimension of graph\n",
    "sparsity = 0.2 # erdos-renyi sparsity of true precision matrix\n",
    "w_max, w_min = 0.5, 1 # sample true precision matrix entries ~U[w_min, w_max] \n",
    "sample_size = 500 # Number of samples from the true graph\n",
    "lr_glad = 0.03 # Learning rate of GLAD\n",
    "use_optimizer = 'adam' # Optimizer\n",
    "INIT_DIAG = 0 # Initialize as (S + theta_init_offset * I)^-1\n",
    "lambda_init = 1 # Initial lambda value\n",
    "L = 15 # Number of unrolled iterations"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Preparing the input data & output precision matrix"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "# initializing precision matrix\n",
    "def get_sparsity_pattern(seed=None):\n",
    "    if seed != None:\n",
    "        np.random.seed(seed)\n",
    "    prob = sparsity\n",
    "    G = nx.generators.random_graphs.gnp_random_graph(D, prob, seed=seed, directed=False)\n",
    "    edge_connections = nx.adjacency_matrix(G).todense() # adjacency matrix\n",
    "    return edge_connections\n",
    "\n",
    "# Get the input data and corresponding output true precision matrix for training\n",
    "def get_samples(edge_connections, seed=None, u=0.1): # mean = 0\n",
    "    mean_value = 0 # zero mean of Gaussian distribution\n",
    "    mean_normal = np.ones(D) * mean_value\n",
    "    if seed != None:\n",
    "        np.random.seed(seed)\n",
    "        \n",
    "    # uniform [w_min, w_max]\n",
    "    U = np.matrix(np.random.random((D, D)) * (w_max - w_min) + w_min)\n",
    "    theta = np.multiply(edge_connections, U)\n",
    "    # making it symmetric\n",
    "    theta = (theta + theta.T)/2 + np.eye(D)\n",
    "    smallest_eigval = np.min(np.linalg.eigvals(theta))\n",
    "    # Just in case : to avoid numerical error in case a epsilon complex component present\n",
    "    smallest_eigval = smallest_eigval.real\n",
    "    # making the min eigenvalue as u\n",
    "    precision_mat = theta + np.eye(D)*(u - smallest_eigval)\n",
    "    print('Smallest eigenvalue = ', np.min(np.linalg.eigvals(precision_mat)))\n",
    "    \n",
    "    cov = np.linalg.inv(precision_mat) # avoiding the use of pinv as data not true representative of conditional independencies.\n",
    "    # get the samples \n",
    "    if seed != None:\n",
    "        np.random.seed(seed)\n",
    "    # Sampling data from multivariate normal distribution\n",
    "    data = np.random.multivariate_normal(mean=mean_normal, cov=cov, size=sample_size)\n",
    "    print('data: ', data.shape, ' theta: ', theta.shape)\n",
    "    return data, precision_mat # MxD, DxD"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Smallest eigenvalue =  0.10000000000000087\n",
      "data:  (500, 10)  theta:  (10, 10)\n"
     ]
    }
   ],
   "source": [
    "# from prepare_data import get_sparsity_pattern, get_samples\n",
    "# # print(dir(prepare_data))\n",
    "edge_connections = get_sparsity_pattern() # the adjacency matrix\n",
    "X, theta_true = get_samples(edge_connections) # input data = X, output true precision matrix = theta_true\n",
    "#print('Check: ', X, theta_true)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Training the glad"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [],
   "source": [
    "# helper functions \n",
    "USE_CUDA = False\n",
    "def convert_to_torch(data, TESTING_FLAG=False, USE_CUDA=USE_CUDA):# convert from numpy to torch variable \n",
    "    if USE_CUDA == False:\n",
    "        data = torch.from_numpy(data.astype(np.float, copy=False)).type(torch.FloatTensor)\n",
    "        if TESTING_FLAG == True:\n",
    "            data.requires_grad = False\n",
    "    else: # On GPU\n",
    "        if TESTING_FLAG == False:\n",
    "            data = torch.from_numpy(data.astype(np.float, copy=False)).type(torch.FloatTensor).cuda()\n",
    "        else: # testing phase, no need to store the data on the GPU\n",
    "            data = torch.from_numpy(data.astype(np.float, copy=False)).type(torch.FloatTensor).cuda()\n",
    "            data.requires_grad = False\n",
    "    return data\n",
    "\n",
    "def get_optimizers(model_glad):\n",
    "    lrG = lr_glad\n",
    "    if use_optimizer == 'adam':\n",
    "        optimizer_glad = torch.optim.Adam(model_glad.parameters(), lr=lrG, betas=(0.9, 0.999), eps=1e-08, weight_decay=0)\n",
    "    else:\n",
    "        print('Optimizer not found!')\n",
    "    return optimizer_glad\n",
    "criterion_graph = nn.MSELoss()\n",
    "# Consider that all the data can be shifted to GPU\n",
    "X = convert_to_torch(X)\n",
    "theta_true = convert_to_torch(theta_true, TESTING_FLAG=True)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Training GLAD using supervision"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {
    "scrolled": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "epoch:  0  loss:  0.19022478\n",
      ": Recovery :FDR, TPR, FPR, SHD, nnz_true, nnz_pred, precision, recall, Fb, aupr, auc \n",
      "nan 0.0 0.0 8.0 8.0 0.0 nan 0.0 0.0 0.178 0.5\n",
      "epoch:  1  loss:  0.17156953\n",
      "epoch:  2  loss:  0.14752331\n",
      "epoch:  3  loss:  0.11952779\n",
      "epoch:  4  loss:  0.09275508\n",
      "epoch:  5  loss:  0.06839868\n",
      ": Recovery :FDR, TPR, FPR, SHD, nnz_true, nnz_pred, precision, recall, Fb, aupr, auc \n",
      "0.0 1.0 0.0 0.0 8.0 8.0 1.0 1.0 1.0 1.0 1.0\n",
      "epoch:  6  loss:  0.049231812\n",
      "epoch:  7  loss:  0.038904343\n",
      "epoch:  8  loss:  0.03514349\n",
      "epoch:  9  loss:  0.027933873\n",
      "epoch:  10  loss:  0.020603932\n",
      ": Recovery :FDR, TPR, FPR, SHD, nnz_true, nnz_pred, precision, recall, Fb, aupr, auc \n",
      "0.0 1.0 0.0 0.0 8.0 8.0 1.0 1.0 1.0 1.0 1.0\n",
      "epoch:  11  loss:  0.01518403\n",
      "epoch:  12  loss:  0.011571886\n",
      "epoch:  13  loss:  0.009186978\n",
      "epoch:  14  loss:  0.0075738896\n",
      "epoch:  15  loss:  0.006446015\n",
      ": Recovery :FDR, TPR, FPR, SHD, nnz_true, nnz_pred, precision, recall, Fb, aupr, auc \n",
      "0.0 1.0 0.0 0.0 8.0 8.0 1.0 1.0 1.0 1.0 1.0\n",
      "epoch:  16  loss:  0.0056362622\n",
      "epoch:  17  loss:  0.0050434275\n",
      "epoch:  18  loss:  0.0046049035\n",
      "epoch:  19  loss:  0.004271282\n",
      "epoch:  20  loss:  0.004013631\n",
      ": Recovery :FDR, TPR, FPR, SHD, nnz_true, nnz_pred, precision, recall, Fb, aupr, auc \n",
      "0.2 1.0 0.054 2.0 8.0 10.0 0.8 1.0 0.889 1.0 1.0\n",
      "epoch:  21  loss:  0.0038124963\n",
      "epoch:  22  loss:  0.0036544295\n",
      "epoch:  23  loss:  0.0035316444\n",
      "epoch:  24  loss:  0.0034361067\n",
      "epoch:  25  loss:  0.003361637\n",
      ": Recovery :FDR, TPR, FPR, SHD, nnz_true, nnz_pred, precision, recall, Fb, aupr, auc \n",
      "0.529 1.0 0.243 9.0 8.0 17.0 0.471 1.0 0.64 1.0 1.0\n",
      "epoch:  26  loss:  0.0033035744\n",
      "epoch:  27  loss:  0.0032584274\n",
      "epoch:  28  loss:  0.0032241829\n",
      "epoch:  29  loss:  0.0031980337\n",
      "epoch:  30  loss:  0.0031783634\n",
      ": Recovery :FDR, TPR, FPR, SHD, nnz_true, nnz_pred, precision, recall, Fb, aupr, auc \n",
      "0.579 1.0 0.297 11.0 8.0 19.0 0.421 1.0 0.593 1.0 1.0\n",
      "epoch:  31  loss:  0.0031635375\n",
      "epoch:  32  loss:  0.0031526326\n",
      "epoch:  33  loss:  0.0031446493\n",
      "epoch:  34  loss:  0.0031389531\n",
      "epoch:  35  loss:  0.003134932\n",
      ": Recovery :FDR, TPR, FPR, SHD, nnz_true, nnz_pred, precision, recall, Fb, aupr, auc \n",
      "0.636 1.0 0.378 14.0 8.0 22.0 0.364 1.0 0.533 1.0 1.0\n",
      "epoch:  36  loss:  0.0031322152\n",
      "epoch:  37  loss:  0.003130522\n",
      "epoch:  38  loss:  0.0031295554\n",
      "epoch:  39  loss:  0.0031293428\n"
     ]
    }
   ],
   "source": [
    "# Initialize the model\n",
    "model_glad = glad_model(L=L, theta_init_offset=0.1, nF=3, H=3, USE_CUDA=USE_CUDA)\n",
    "optimizer_glad = get_optimizers(model_glad)\n",
    "# get the sample covariance matrix for GLAD: Note, adjust the mean if needed\n",
    "S = torch.matmul(X.t(), X)/X.shape[0] # DxD matrix\n",
    "for epoch in range(40):\n",
    "    optimizer_glad.zero_grad()\n",
    "    theta_pred, loss = glad(S, theta_true, model_glad, [D, INIT_DIAG, lambda_init, L],criterion_graph)\n",
    "#    print(theta_true.shape, theta_pred.shape)\n",
    "    loss.backward() # calculate the gradients\n",
    "    optimizer_glad.step() # update the weights\n",
    "    compare_theta = report_metrics(np.array(theta_true), theta_pred[0].detach().numpy())\n",
    "    print('epoch: ', epoch, ' loss: ', loss.detach().numpy()[0])\n",
    "    if epoch %5 == 0:\n",
    "        print(': Recovery :FDR, TPR, FPR, SHD, nnz_true, nnz_pred, precision, recall, Fb, aupr, auc ')\n",
    "        print( *np.around(compare_theta, 3))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "glad",
   "language": "python",
   "name": "glad"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.11"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
