{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/users/sukwon/anaconda3/envs/test/lib/python3.9/site-packages/scipy/__init__.py:132: UserWarning: A NumPy version >=1.21.6 and <1.28.0 is required for this version of SciPy (detected version 1.21.5)\n",
      "  warnings.warn(f\"A NumPy version >={np_minversion} and <{np_maxversion}\"\n"
     ]
    }
   ],
   "source": [
    "import anndata as ad\n",
    "import numpy as np\n",
    "import scanpy as sc\n",
    "import pandas as pd\n",
    "\n",
    "\n",
    "import seaborn as sns\n",
    "from collections import Counter\n",
    "from sklearn.neighbors import NearestNeighbors\n",
    "import pandas as pd\n",
    "import sys\n",
    "sys.path.append('..')\n",
    "import matplotlib.pyplot as plt\n",
    "from sklearn.metrics import adjusted_rand_score\n",
    "import os\n",
    "# os.chdir(os.path.dirname(os.path.abspath(__file__))) # debugging\n",
    "\n",
    "from scipy.stats import spearmanr, pearsonr\n",
    "from sklearn import preprocessing"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 77,
   "metadata": {},
   "outputs": [],
   "source": [
    "def generate_adata(data, modalities='pPDm'):\n",
    "    \"\"\"Pack the views and labels of a multi-view dataset into an AnnData object.\n",
    "\n",
    "    Parameters\n",
    "    ----------\n",
    "    data : mapping\n",
    "        Indexable by 'view_0', 'view_1', ... and 'labels', e.g. the object\n",
    "        returned by ``np.load`` on an .npz archive.\n",
    "    modalities : iterable of str\n",
    "        One ``obsm`` key per view; the i-th entry names ``data['view_{i}']``.\n",
    "        Iterating a string yields one single-character key per view.\n",
    "\n",
    "    Returns\n",
    "    -------\n",
    "    anndata.AnnData\n",
    "        ``X`` is an all-zero (n_obs, 1) placeholder, every view is stored in\n",
    "        ``obsm`` under its modality key, and ``obs['label']`` holds\n",
    "        ``data['labels']``.\n",
    "\n",
    "    Raises\n",
    "    ------\n",
    "    KeyError\n",
    "        If ``data`` lacks 'view_0', 'labels', or a view required by\n",
    "        ``modalities``.\n",
    "    \"\"\"\n",
    "    # Look the row count up once: for a lazily loaded .npz archive every\n",
    "    # data[...] access reads the array from disk again.\n",
    "    n_obs = data['view_0'].shape[0]\n",
    "\n",
    "    adata = ad.AnnData(X=np.zeros((n_obs, 1)))  # Placeholder for X\n",
    "\n",
    "    # Add views to obsm according to modalities\n",
    "    for i, modality in enumerate(modalities):\n",
    "        adata.obsm[modality] = data[f'view_{i}']\n",
    "\n",
    "    # Reset obs to an empty frame indexed 0..n_obs-1, then attach the labels.\n",
    "    adata.obs = pd.DataFrame(index=pd.RangeIndex(n_obs))\n",
    "    adata.obs['label'] = data['labels']\n",
    "\n",
    "    return adata"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 71,
   "metadata": {},
   "outputs": [],
   "source": [
    "# data_path = './UnitedNet_NatComm_data/Dyngen'\n",
    "# view = 'mean' # '0' or '1', 'mean'\n",
    "\n",
    "# for cv_idx in range(5):\n",
    "#     Pm_train = np.load(data_path+f'/dyngen_linear_train_cv{cv_idx}_Pm.npz')\n",
    "#     pPRm_train = np.load(data_path+f'/dyngen_linear_train_cv{cv_idx}_pPRm.npz')\n",
    "#     PRmp_train = np.load(data_path+f'/dyngen_linear_train_cv{cv_idx}_PRmp.npz')\n",
    "#     Rm_train = np.load(data_path+f'/dyngen_linear_train_cv{cv_idx}_Rm.npz')\n",
    "\n",
    "#     Pm_test = np.load(data_path+f'/dyngen_linear_test_cv{cv_idx}_Pm.npz')\n",
    "#     pPRm_test = np.load(data_path+f'/dyngen_linear_test_cv{cv_idx}_pPRm.npz')\n",
    "#     PRmp_test = np.load(data_path+f'/dyngen_linear_test_cv{cv_idx}_PRmp.npz')\n",
    "#     Rm_test = np.load(data_path+f'/dyngen_linear_test_cv{cv_idx}_Rm.npz')\n",
    "\n",
    "#     Pm_train = generate_adata(Pm_train, view)\n",
    "#     pPRm_train = generate_adata(pPRm_train, view)\n",
    "#     PRmp_train = generate_adata(PRmp_train, view)\n",
    "#     Rm_train = generate_adata(Rm_train, view)\n",
    "\n",
    "#     Pm_test = generate_adata(Pm_test, view)\n",
    "#     pPRm_test = generate_adata(pPRm_test, view)\n",
    "#     PRmp_test = generate_adata(PRmp_test, view)\n",
    "#     Rm_test = generate_adata(Rm_test, view)\n",
    "\n",
    "#     Pm_train.write(data_path + f'/adata_Pm_train_cv_{str(cv_idx)}_view_{view}.h5ad')\n",
    "#     pPRm_train.write(data_path + f'/adata_pPRm_train_cv_{str(cv_idx)}_view_{view}.h5ad')\n",
    "#     PRmp_train.write(data_path + f'/adata_PRmp_train_cv_{str(cv_idx)}_view_{view}.h5ad')\n",
    "#     Rm_train.write(data_path + f'/adata_Rm_train_cv_{str(cv_idx)}_view_{view}.h5ad')\n",
    "\n",
    "#     Pm_test.write(data_path + f'/adata_Pm_test_cv_{str(cv_idx)}_view_{view}.h5ad')\n",
    "#     pPRm_test.write(data_path + f'/adata_pPRm_test_cv_{str(cv_idx)}_view_{view}.h5ad')\n",
    "#     PRmp_test.write(data_path + f'/adata_PRmp_test_cv_{str(cv_idx)}_view_{view}.h5ad')\n",
    "#     Rm_test.write(data_path + f'/adata_Rm_test_cv_{str(cv_idx)}_view_{view}.h5ad')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 78,
   "metadata": {},
   "outputs": [],
   "source": [
    "data_path = './UnitedNet_NatComm_data/Dyngen'\n",
    "\n",
    "# Convert the train/test .npz archive of every cv index into an .h5ad file.\n",
    "for cv_idx in range(5):\n",
    "    # np.load on an .npz returns an NpzFile that keeps the archive open;\n",
    "    # the context manager closes it once generate_adata has read the arrays.\n",
    "    with np.load(data_path+f'/dyngen_linear_train_cv{cv_idx}_pPRm.npz') as train_npz:\n",
    "        pPRm_train = generate_adata(train_npz, modalities='pPDm')\n",
    "    with np.load(data_path+f'/dyngen_linear_test_cv{cv_idx}_pPRm.npz') as test_npz:\n",
    "        pPRm_test = generate_adata(test_npz, modalities='pPDm')\n",
    "\n",
    "    # pPRm_train / pPRm_test stay bound to the last index after the loop.\n",
    "    pPRm_train.write(data_path + f'/adata_pPRm_train_cv_{cv_idx}.h5ad')\n",
    "    pPRm_test.write(data_path + f'/adata_pPRm_test_cv_{cv_idx}.h5ad')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 80,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[ 0.61121568, -3.18135532,  0.58849298, ..., -0.5370795 ,\n",
       "        -0.59170906, -0.57164054],\n",
       "       [ 0.4499125 , -3.18135532,  1.12775108, ..., -0.5370795 ,\n",
       "        -0.59170906, -0.57164054],\n",
       "       [ 0.3252794 ,  0.39300304,  0.50720241, ..., -0.5370795 ,\n",
       "        -0.59170906, -0.57164054],\n",
       "       ...,\n",
       "       [ 0.84823018,  0.82689732,  0.80938191, ..., -0.5370795 ,\n",
       "        -0.59170906, -0.57164054],\n",
       "       [ 0.41233362, -0.39722286, -1.67280028, ..., -0.5370795 ,\n",
       "        -0.59170906, -0.57164054],\n",
       "       [ 1.01171411, -3.18135532,  0.6439314 , ..., -0.5370795 ,\n",
       "        -0.59170906, -0.57164054]])"
      ]
     },
     "execution_count": 80,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "pPRm_train.obsm['p']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3.9.18 ('test')",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.16"
  },
  "orig_nbformat": 4,
  "vscode": {
   "interpreter": {
    "hash": "eae09bf71f880f5d1d9ce3367b3975f7f40d81b42cbf95bb2da649c5d0b35075"
   }
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
