{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import sys\n",
    "import random\n",
    "import warnings\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import netplotbrain as ntb\n",
    "import matplotlib.pyplot as plt\n",
    "from sklearn.preprocessing import StandardScaler\n",
    "\n",
    "warnings.filterwarnings('ignore')\n",
    "sys.path.insert(0, '../GRAPH_Framework-main')\n",
    "from tasks.experiment import ModelTest"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def adjacency_helper(adjacency_matrix):\n",
    "    connections = []\n",
    "    for i in range(len(adjacency_matrix)):\n",
    "        for j in range(len(adjacency_matrix[i])):\n",
    "            if i != j:\n",
    "                if np.abs(adjacency_matrix[i][j]) >= 0.05:\n",
    "                    connections.append([i, j])\n",
    "\n",
    "    df = pd.DataFrame(connections, columns=['i', 'j'])\n",
    "    return df\n",
    "\n",
    "def helper(global_runtime, mf_runtime, global_loss, mf_loss, global_disp, mf_disp):\n",
    "    mean_val1, mean_val2, mean_val3, mean_val4 = np.mean(global_loss), np.mean(mf_loss), np.mean(global_disp), np.mean(mf_disp)\n",
    "    mean_val5, std_val5 = np.mean(global_runtime), np.std(global_runtime)\n",
    "    mean_val6, std_val6 = np.mean(mf_runtime), np.std(mf_runtime)\n",
    "    output = f\"{mean_val1:.4f} & {mean_val2:.4f} & {(mean_val1-mean_val2)/mean_val1*100:.6f}\\% & {mean_val3:.7f} & {mean_val4:.7f} & +{(mean_val3-mean_val4)/mean_val3*100:.6f}\\% & {mean_val5:.3f} ($\\pm$ {std_val5:.2f}) & {mean_val6:.2f} ($\\pm$ {std_val6:.2f})\"\n",
    "    print(output)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### TADPOLE"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "df_data = pd.read_csv(\"../Source_Data/ADNI all/TADPOLE_D1_D2.csv\")\n",
    "df_dict = pd.read_csv(\"../Source_Data/ADNI all/TADPOLE_D1_D2_Dict.csv\")\n",
    "adni = pd.read_csv('../Source_Data/ADNI all/ADNIMERGE.csv').reset_index(drop=True)\n",
    "ROI = pd.read_csv('../Source_Data/ADNI all/G_lobe_yeo.csv').reset_index(drop=True)\n",
    "ROI = ROI['Unnamed: 0'].to_list()\n",
    "\n",
    "atlas = pd.read_csv('../Source_Data/ADNI all/dk.csv')\n",
    "nodes_df = atlas[['x.mni', 'y.mni', 'z.mni']]\n",
    "nodes_df.columns = ['x', 'y', 'z']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "## Check the location of the AV45 (cortical data)\n",
    "# Extract target rows in the dict file\n",
    "df_dict_av45 = df_dict.iloc[1201:1448,:]\n",
    "\n",
    "df_dict_av45ctx = df_dict_av45[df_dict_av45['FLDNAME'].str.contains('CTX_')& df_dict_av45['FLDNAME'].str.contains('SUVR')]\n",
    "df_dict_av45ctx = df_dict_av45ctx[ df_dict_av45ctx[\"FLDNAME\" ].str.contains( \"UNKNOWN\" )==False ]\n",
    "\n",
    "df_dict_av45wc = df_dict_av45[df_dict_av45['FLDNAME'].str.contains('WHOLECEREBELLUM_SUVR')]\n",
    "df_dict_av45ctx\n",
    "\n",
    "# Extract ID, DX, VISCODE, target features in the dataset\n",
    "\n",
    "df_label = df_data[[\"RID\",\"VISCODE\"]]\n",
    "df_features = df_data.iloc[:,df_dict_av45ctx.index-9] # cortical calues\n",
    "df_ref = df_data.iloc[:,df_dict_av45wc.index-9] # refrence regions\n",
    "\n",
    "for i in range(0,df_features.shape[-1]):\n",
    "    df_features.iloc[:,i] = pd.to_numeric(df_features.iloc[:,i].str.replace(\",\", \"\"), errors='coerce') # to remove nan values\n",
    "df_ref.iloc[:,0] = pd.to_numeric(df_ref.iloc[:,0].str.replace(\",\", \"\"), errors='coerce')\n",
    "\n",
    "# drop nan\n",
    "df_feature_av45 = pd.concat([df_features,df_label],axis=1)\n",
    "df_feature_av45 = df_feature_av45.dropna(thresh=68)\n",
    "df_ref = df_ref.dropna()\n",
    "\n",
    "# extract column name\n",
    "col_name_av45 = []\n",
    "for i in range(df_feature_av45.shape[1]-df_label.shape[1]):\n",
    "    col_name_av45.append(\"_\".join(df_feature_av45.columns.values[i].split('_')[1:3]))\n",
    "col_name_av45 = np.concatenate((col_name_av45,df_feature_av45.columns.values[-3:]))\n",
    "\n",
    "# normalization\n",
    "df_feature_av45_norm = pd.DataFrame(columns=col_name_av45)\n",
    "\n",
    "for i in range (df_feature_av45.shape[1]-df_label.shape[1]):\n",
    "    df_feature_av45_norm.iloc[:,i] = df_feature_av45.iloc[:,i]/df_ref.iloc[:,0]\n",
    "df_feature_av45_norm.iloc[:,-3:] = df_feature_av45.iloc[:,-3:]\n",
    "\n",
    "df_feature_av45_norm = df_feature_av45_norm.reset_index(drop=True)\n",
    "df_feature_av45_norm\n",
    "\n",
    "# Select first visit\n",
    "\n",
    "# Choose the first session if more than 1 session\n",
    "RIDu = df_feature_av45_norm[\"RID\"].unique()\n",
    "df_av45bl = pd.DataFrame()\n",
    "for i in range(len(RIDu)):\n",
    "    df1 = df_feature_av45_norm.loc[(df_feature_av45_norm['RID'] == RIDu[i])].head(1)\n",
    "    df_av45bl=pd.concat([df_av45bl,df1],axis=0)\n",
    "df_av45bl = df_av45bl.reset_index()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "## Check the location of the AV1451 (cortical data)\n",
    "# Extract target rows in the dict file\n",
    "df_dict_tau = df_dict.iloc[1450:1691,:]\n",
    "\n",
    "df_dict_tauctx = df_dict_tau[df_dict_tau['FLDNAME'].str.contains('CTX_')& df_dict_tau['FLDNAME'].str.contains('SUVR')]\n",
    "df_dict_tauctx = df_dict_tauctx[ df_dict_tauctx[\"FLDNAME\" ].str.contains( \"UNKNOWN\" )==False ]\n",
    "\n",
    "df_dict_tauic = df_dict_tau[df_dict_tau['FLDNAME'].str.contains('INFERIORCEREBELLUM_SUVR')]\n",
    "df_dict_tauctx\n",
    "\n",
    "# Extract ID, DX, VISCODE, target features in the dataset\n",
    "df_label = df_data[[\"RID\",\"VISCODE\",\"ADAS13\"]] #MMSE,ADAS11\n",
    "df_features = df_data.iloc[:,df_dict_tauctx.index-12] # cortical calues\n",
    "df_ref = df_data.iloc[:,df_dict_tauic.index-12] # refrence regions\n",
    "\n",
    "for i in range(0,df_features.shape[-1]):\n",
    "    df_features.iloc[:,i] = pd.to_numeric(df_features.iloc[:,i].str.replace(\",\", \"\"), errors='coerce') # to remove nan values\n",
    "df_ref.iloc[:,0] = pd.to_numeric(df_ref.iloc[:,0].str.replace(\",\", \"\"), errors='coerce')\n",
    "\n",
    "# drop nan\n",
    "df_feature_tau = pd.concat([df_features,df_label],axis=1)\n",
    "df_feature_tau = df_feature_tau.dropna(thresh=68)\n",
    "df_ref = df_ref.dropna()\n",
    "\n",
    "# extract column name\n",
    "col_name_tau = []\n",
    "for i in range(df_feature_tau.shape[1]-df_label.shape[1]):\n",
    "    col_name_tau.append(\"_\".join(df_feature_tau.columns.values[i].split('_')[1:3]))\n",
    "col_name_tau = np.concatenate((col_name_tau,df_feature_tau.columns.values[-3:]))\n",
    "\n",
    "# normalization\n",
    "df_feature_tau_norm = pd.DataFrame(columns=col_name_tau)\n",
    "\n",
    "for i in range (df_feature_tau.shape[1]-df_label.shape[1]):\n",
    "    df_feature_tau_norm.iloc[:,i] = df_feature_tau.iloc[:,i]/df_ref.iloc[:,0]\n",
    "df_feature_tau_norm.iloc[:,-3:] = df_feature_tau.iloc[:,-3:]\n",
    "\n",
    "df_feature_tau_norm = df_feature_tau_norm.reset_index(drop=True)\n",
    "df_feature_tau_norm\n",
    "\n",
    "# Choose the first session if more than 1 session\n",
    "RIDu = df_feature_tau_norm[\"RID\"].unique()\n",
    "df_taubl = pd.DataFrame()\n",
    "for i in range(len(RIDu)):\n",
    "    df1 = df_feature_tau_norm.loc[(df_feature_tau_norm['RID'] == RIDu[i])].head(1)\n",
    "    df_taubl=pd.concat([df_taubl,df1],axis=0)\n",
    "df_taubl = df_taubl.reset_index()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### AV45"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "df = pd.merge(df_av45bl, adni[['RID', 'PTGENDER', 'PTMARRY', 'PTRACCAT', 'VISCODE']], \n",
    "              how='inner', left_on=['RID','VISCODE'], right_on=['RID','VISCODE']).dropna()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "## MARITAL STATUS\n",
    "known = df.loc[df['PTMARRY'] != 'Unknown'].dropna()\n",
    "married = known.loc[known['PTMARRY'] == 'Married']\n",
    "single = known.loc[known['PTMARRY'] == 'Never married']\n",
    "\n",
    "av45 = np.array(known[ROI].dropna())\n",
    "av451 = np.array(single[ROI].dropna())\n",
    "av452 = np.array(married[ROI].dropna())\n",
    "\n",
    "scaler = StandardScaler()\n",
    "D = scaler.fit_transform(av45.T).T\n",
    "D1 = scaler.fit_transform(av451.T).T\n",
    "D2 = scaler.fit_transform(av452.T).T\n",
    "D_lt = [D1, D2]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "parameters = {'max_iter':1000, 'lam':0.3, 'lamm':0.3, 'rhom':1, 'tol':1e-10} # MARITAL STATUS\n",
    "precision_train = ModelTest(model_type='Precision',showfig=False)\n",
    "precision_train.group_graph(D,D_lt,parameters)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "precision_train.runtime(1,D,D_lt,parameters)\n",
    "precision_train.summary()\n",
    "precision_train.plot()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def adjacency_helper(adjacency_matrix, threshold=0.05): # MARITAL STATUS\n",
    "    connections = []\n",
    "    for i in range(len(adjacency_matrix)):\n",
    "        for j in range(len(adjacency_matrix[i])):\n",
    "            if i != j:\n",
    "                if np.abs(adjacency_matrix[i][j]) >= threshold:\n",
    "                    connections.append([i, j])\n",
    "\n",
    "    df = pd.DataFrame(connections, columns=['i', 'j'])\n",
    "    return df\n",
    "\n",
    "def soft_thresholding(matrix, threshold=0.05):\n",
    "    return np.sign(matrix) * np.maximum(np.abs(matrix) - threshold, 0)\n",
    "\n",
    "# \n",
    "edges_df1 = adjacency_helper(precision_train.global_output)\n",
    "edges_df2 = adjacency_helper(precision_train.mf_output)\n",
    "diff_edges = adjacency_helper(precision_train.global_output - precision_train.mf_output, threshold=0.05)\n",
    "\n",
    "# \n",
    "unique1 = pd.merge(edges_df1, diff_edges, left_on=['i','j'], right_on=['i','j'], how='inner')\n",
    "unique2 = pd.merge(edges_df2, diff_edges, left_on=['i','j'], right_on=['i','j'], how='inner')\n",
    "\n",
    "# \n",
    "concat_df = pd.concat([unique1, unique2])\n",
    "duplicate_mask = concat_df.duplicated(keep=False)\n",
    "df1_filtered = unique1[~duplicate_mask[:len(unique1)]]\n",
    "df2_filtered = unique2[~duplicate_mask[len(unique2):]]\n",
    "\n",
    "# \n",
    "adjacency_matrix1 = np.zeros((68, 68))\n",
    "for i in range(len(unique1)):\n",
    "    adjacency_matrix1[int(unique1.iloc[i][0])][int(unique1.iloc[i][1])] = 1\n",
    "\n",
    "adjacency_matrix2 = np.zeros((68, 68))\n",
    "for i in range(len(unique2)):\n",
    "    adjacency_matrix2[int(unique2.iloc[i][0])][int(unique2.iloc[i][1])] = 1\n",
    "\n",
    "# \n",
    "community1 = set(list(np.array(unique1).flatten()))\n",
    "nodes_df1 = nodes_df.copy()\n",
    "nodes_df1['communities'] = np.NAN\n",
    "nodes_df1['degree_centrality'] = np.NAN\n",
    "for index in community1:\n",
    "    nodes_df1['communities'][index] = 2\n",
    "    nodes_df1['degree_centrality'][index] = 2\n",
    "\n",
    "nodes_df1['communities'] = nodes_df1['communities'].fillna(1)\n",
    "nodes_df1['degree_centrality'] = nodes_df1['degree_centrality'].fillna(1)\n",
    "\n",
    "# \n",
    "community2 = set(list(np.array(unique2).flatten()))\n",
    "nodes_df2 = nodes_df.copy()\n",
    "nodes_df2['communities'] = np.NAN\n",
    "nodes_df2['degree_centrality'] = np.NAN\n",
    "for index in community2:\n",
    "    nodes_df2['communities'][index] = 2\n",
    "    nodes_df2['degree_centrality'][index] = 2\n",
    "\n",
    "nodes_df2['communities'] = nodes_df2['communities'].fillna(1)\n",
    "nodes_df2['degree_centrality'] = nodes_df2['degree_centrality'].fillna(1)\n",
    "\n",
    "# \n",
    "ntb.plot(template='MNI152NLin2009cAsym', template_style='glass', view=['LSA'],\n",
    "         nodes=nodes_df1, edges=edges_df1,  highlight_edges=adjacency_matrix1, highlight_level=0.85,\n",
    "         node_color='communities', edge_color='lightblue', node_size='degree_centrality', arrowaxis=None)\n",
    "\n",
    "plt.savefig('brain_standard.png', dpi=300, bbox_inches='tight', pad_inches=0.1)\n",
    "plt.show()\n",
    "\n",
    "# \n",
    "highlights2 = np.array(edges_df2[~edges_df2.isin(edges_df1)].dropna())\n",
    "ntb.plot(template='MNI152NLin2009cAsym', template_style='glass', view=['LSA'],\n",
    "         nodes=nodes_df2, edges=edges_df2, highlight_edges=adjacency_matrix2, highlight_level=0.85,\n",
    "         node_color='communities', edge_color='lightblue', node_size='degree_centrality', arrowaxis=None)\n",
    "\n",
    "plt.savefig('brain_fair.png', dpi=300, bbox_inches='tight', pad_inches=0.1)\n",
    "plt.show()\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Tau"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "df = pd.merge(df_taubl, adni[['RID', 'PTGENDER', 'PTMARRY', 'PTRACCAT', 'VISCODE']], how='inner', left_on=['RID','VISCODE'], right_on=['RID','VISCODE']).dropna()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "## RACE\n",
    "white = df.loc[df['PTRACCAT'] == 'White']\n",
    "nonwhite = df.loc[df['PTRACCAT'] != 'White']\n",
    "\n",
    "av45 = np.array(df[ROI].dropna())\n",
    "av451 = np.array(white[ROI].dropna())\n",
    "av452 = np.array(nonwhite[ROI].dropna())\n",
    "\n",
    "scaler = StandardScaler()\n",
    "D = scaler.fit_transform(av45.T).T\n",
    "D1 = scaler.fit_transform(av451.T).T\n",
    "D2 = scaler.fit_transform(av452.T).T\n",
    "D_lt = [D1, D2]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "parameters = {'max_iter':1000, 'lam':0.2, 'lamm':0.2, 'rhom':1, 'tol':1e-10}\n",
    "precision_train = ModelTest(model_type='Precision',showfig=False)\n",
    "precision_train.group_graph(D,D_lt,parameters)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "precision_train.runtime(1,D,D_lt,parameters)\n",
    "precision_train.summary()\n",
    "precision_train.plot()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def adjacency_helper(adjacency_matrix, threshold=0.1): # RACE\n",
    "    connections = []\n",
    "    for i in range(len(adjacency_matrix)):\n",
    "        for j in range(len(adjacency_matrix[i])):\n",
    "            if i != j:\n",
    "                if np.abs(adjacency_matrix[i][j]) >= threshold:\n",
    "                    connections.append([i, j])\n",
    "\n",
    "    df = pd.DataFrame(connections, columns=['i', 'j'])\n",
    "    return df\n",
    "\n",
    "def soft_thresholding(matrix, threshold=0.05):\n",
    "    return np.sign(matrix) * np.maximum(np.abs(matrix) - threshold, 0)\n",
    "\n",
    "# \n",
    "edges_df1 = adjacency_helper(precision_train.global_output)\n",
    "edges_df2 = adjacency_helper(precision_train.mf_output)\n",
    "diff_edges = adjacency_helper(precision_train.global_output - precision_train.mf_output, threshold=0.05)\n",
    "\n",
    "# \n",
    "unique1 = pd.merge(edges_df1, diff_edges, left_on=['i','j'], right_on=['i','j'], how='inner')\n",
    "unique2 = pd.merge(edges_df2, diff_edges, left_on=['i','j'], right_on=['i','j'], how='inner')\n",
    "\n",
    "# \n",
    "concat_df = pd.concat([unique1, unique2])\n",
    "duplicate_mask = concat_df.duplicated(keep=False)\n",
    "df1_filtered = unique1[~duplicate_mask[:len(unique1)]]\n",
    "df2_filtered = unique2[~duplicate_mask[len(unique2):]]\n",
    "\n",
    "# \n",
    "adjacency_matrix1 = np.zeros((68, 68))\n",
    "for i in range(len(unique1)):\n",
    "    adjacency_matrix1[int(unique1.iloc[i][0])][int(unique1.iloc[i][1])] = 1\n",
    "\n",
    "adjacency_matrix2 = np.zeros((68, 68))\n",
    "for i in range(len(unique2)):\n",
    "    adjacency_matrix2[int(unique2.iloc[i][0])][int(unique2.iloc[i][1])] = 1\n",
    "\n",
    "# \n",
    "community1 = set(list(np.array(unique1).flatten()))\n",
    "nodes_df1 = nodes_df.copy()\n",
    "nodes_df1['communities'] = np.NAN\n",
    "nodes_df1['degree_centrality'] = np.NAN\n",
    "for index in community1:\n",
    "    nodes_df1['communities'][index] = 2\n",
    "    nodes_df1['degree_centrality'][index] = 2\n",
    "\n",
    "# \n",
    "nodes_df1['communities'] = nodes_df1['communities'].fillna(1)\n",
    "nodes_df1['degree_centrality'] = nodes_df1['degree_centrality'].fillna(1)\n",
    "\n",
    "community2 = set(list(np.array(unique2).flatten()))\n",
    "nodes_df2 = nodes_df.copy()\n",
    "nodes_df2['communities'] = np.NAN\n",
    "nodes_df2['degree_centrality'] = np.NAN\n",
    "for index in community2:\n",
    "    nodes_df2['communities'][index] = 2\n",
    "    nodes_df2['degree_centrality'][index] = 2\n",
    "\n",
    "# \n",
    "nodes_df2['communities'] = nodes_df2['communities'].fillna(1)\n",
    "nodes_df2['degree_centrality'] = nodes_df2['degree_centrality'].fillna(1)\n",
    "\n",
    "# \n",
    "ntb.plot(template='MNI152NLin2009cAsym', template_style='glass', view=['LSA'],\n",
    "         nodes=nodes_df1, edges=edges_df1,  highlight_edges=adjacency_matrix1, highlight_level=0.85,\n",
    "         node_color='communities', edge_color='darkorange', node_size='degree_centrality', arrowaxis=None)\n",
    "\n",
    "plt.savefig('brain_standard.png', dpi=300, bbox_inches='tight', pad_inches=0.1)\n",
    "plt.show()\n",
    "\n",
    "# \n",
    "highlights2 = np.array(edges_df2[~edges_df2.isin(edges_df1)].dropna())\n",
    "ntb.plot(template='MNI152NLin2009cAsym', template_style='glass', view=['LSA'],\n",
    "         nodes=nodes_df2, edges=edges_df2, highlight_edges=adjacency_matrix2, highlight_level=0.85,\n",
    "         node_color='communities', edge_color='darkorange', node_size='degree_centrality', arrowaxis=None)\n",
    "\n",
    "plt.savefig('brain_fair.png', dpi=300, bbox_inches='tight', pad_inches=0.1)\n",
    "plt.show()\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Graph_Learning",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.4"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
