{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "a6223f80-affd-46cc-867c-77a7939684e2",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import numpy as np\n",
    "import scanpy as sc"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "b07aa8a5-8867-4a07-ad97-fd7fab159fe4",
   "metadata": {},
   "outputs": [],
   "source": [
    "multi_file_path = 'data/op_train_multi_targets_0.h5ad'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "4c5642cb-53de-443b-9ee5-454bee7989a3",
   "metadata": {},
   "outputs": [],
   "source": [
    "def adata_dataset(\n",
    "    path: str,\n",
    "    embed_name: str = \"X_pca\",\n",
    "    label_name: str = \"day\",\n",
    "    max_dim: int = 100,\n",
    "):\n",
    "    \"\"\"Load Single Cell dataset from h5ad file using scanpy.\"\"\"\n",
    "\n",
    "    adata = sc.read_h5ad(path)\n",
    "    labels = adata.obs[label_name].astype(\"category\")\n",
    "    ulabels = labels.cat.categories\n",
    "    data = adata.obsm[embed_name][:, :max_dim]\n",
    "\n",
    "    return (data, labels.to_numpy(), ulabels.to_numpy())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "c7d7c42e-069e-49f3-af5d-97b4c951db93",
   "metadata": {},
   "outputs": [],
   "source": [
    "def extrac_data_pca(file_path,data_name,pca_num):\n",
    "    \n",
    "    data,sample_labels,ulabels = adata_dataset(file_path,max_dim=pca_num)\n",
    "    folder = f\"data/{data_name}_{pca_num}\"\n",
    "\n",
    "    os.makedirs(folder, exist_ok=True)\n",
    "    np.save(os.path.join(folder, \"data.npy\"), data)\n",
    "    np.save(os.path.join(folder, \"sample_labels.npy\"), sample_labels)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "e58be29b-7a34-45ee-9a3c-62517bdf1a99",
   "metadata": {},
   "outputs": [],
   "source": [
    "extrac_data_pca(multi_file_path,'multi',50)\n",
    "extrac_data_pca(multi_file_path,'multi',100)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python (JKOnet-star)",
   "language": "python",
   "name": "jkonet-star"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.9"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
