{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "\n",
    "file_dir = \"../../condition/CCSCM\"\n",
    "\n",
    "file_id2ent = f\"{file_dir}/id2ent.json\"\n",
    "file_ent2id = f\"{file_dir}/ent2id.json\"\n",
    "file_id2rel = f\"{file_dir}/id2rel.json\"\n",
    "file_rel2id = f\"{file_dir}/rel2id.json\"\n",
    "\n",
    "with open(file_id2ent, 'r') as file:\n",
    "    cond_id2ent = json.load(file)\n",
    "with open(file_ent2id, 'r') as file:\n",
    "    cond_ent2id = json.load(file)\n",
    "with open(file_id2rel, 'r') as file:\n",
    "    cond_id2rel = json.load(file)\n",
    "with open(file_rel2id, 'r') as file:\n",
    "    cond_rel2id = json.load(file)\n",
    "\n",
    "\n",
    "file_dir = \"../../procedure/CCSPROC\"\n",
    "\n",
    "file_id2ent = f\"{file_dir}/id2ent.json\"\n",
    "file_ent2id = f\"{file_dir}/ent2id.json\"\n",
    "file_id2rel = f\"{file_dir}/id2rel.json\"\n",
    "file_rel2id = f\"{file_dir}/rel2id.json\"\n",
    "\n",
    "with open(file_id2ent, 'r') as file:\n",
    "    proc_id2ent = json.load(file)\n",
    "with open(file_ent2id, 'r') as file:\n",
    "    proc_ent2id = json.load(file)\n",
    "with open(file_id2rel, 'r') as file:\n",
    "    proc_id2rel = json.load(file)\n",
    "with open(file_rel2id, 'r') as file:\n",
    "    proc_rel2id = json.load(file)\n",
    "\n",
    "\n",
    "file_dir = \"../../drug/ATC3\"\n",
    "\n",
    "file_id2ent = f\"{file_dir}/id2ent.json\"\n",
    "file_ent2id = f\"{file_dir}/ent2id.json\"\n",
    "file_id2rel = f\"{file_dir}/id2rel.json\"\n",
    "file_rel2id = f\"{file_dir}/rel2id.json\"\n",
    "\n",
    "with open(file_id2ent, 'r') as file:\n",
    "    drug_id2ent = json.load(file)\n",
    "with open(file_ent2id, 'r') as file:\n",
    "    drug_ent2id = json.load(file)\n",
    "with open(file_id2rel, 'r') as file:\n",
    "    drug_id2rel = json.load(file)\n",
    "with open(file_rel2id, 'r') as file:\n",
    "    drug_rel2id = json.load(file)\n",
    "\n",
    "\n",
    "import csv\n",
    "\n",
    "condition_mapping_file = \"../../../resources/CCSCM.csv\"\n",
    "procedure_mapping_file = \"../../../resources/CCSPROC.csv\"\n",
    "drug_file = \"../../../resources/ATC.csv\"\n",
    "\n",
    "condition_dict = {}\n",
    "with open(condition_mapping_file, newline='') as csvfile:\n",
    "    reader = csv.DictReader(csvfile)\n",
    "    for row in reader:\n",
    "        condition_dict[row['code']] = row['name'].lower()\n",
    "\n",
    "procedure_dict = {}\n",
    "with open(procedure_mapping_file, newline='') as csvfile:\n",
    "    reader = csv.DictReader(csvfile)\n",
    "    for row in reader:\n",
    "        procedure_dict[row['code']] = row['name'].lower()\n",
    "\n",
    "drug_dict = {}\n",
    "with open(drug_file, newline='') as csvfile:\n",
    "    reader = csv.DictReader(csvfile)\n",
    "    for row in reader:\n",
    "        if row['level'] == '3.0':\n",
    "            drug_dict[row['code']] = row['name'].lower()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "cpd_id2ent = {}\n",
    "cpd_id2rel = {}\n",
    "\n",
    "for key in cond_id2ent.keys():\n",
    "    cpd_id2ent[key] = cond_id2ent[key]\n",
    "\n",
    "for key in proc_id2ent.keys():\n",
    "    cpd_id2ent[str(int(key)+len(cond_id2ent))] = proc_id2ent[key]\n",
    "\n",
    "for key in drug_id2ent.keys():\n",
    "    cpd_id2ent[str(int(key)+len(cond_id2ent)+len(proc_id2ent))] = drug_id2ent[key]\n",
    "\n",
    "cpd_ent2id = {value: key for key, value in cpd_id2ent.items()}\n",
    "\n",
    "\n",
    "for key in cond_id2rel.keys():\n",
    "    cpd_id2rel[key] = cond_id2rel[key]\n",
    "\n",
    "for key in proc_id2rel.keys():\n",
    "    cpd_id2rel[str(int(key)+len(cond_id2rel))] = proc_id2rel[key]\n",
    "\n",
    "for key in drug_id2rel.keys():\n",
    "    cpd_id2rel[str(int(key)+len(cond_id2rel)+len(proc_id2rel))] = drug_id2rel[key]\n",
    "\n",
    "cpd_rel2id = {value: key for key, value in cpd_id2rel.items()}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(42056, 9404)"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "len(cpd_id2ent), len(cpd_id2rel)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "out_file_id2ent = f\"./id2ent.json\"\n",
    "out_file_ent2id = f\"./ent2id.json\"\n",
    "out_file_id2rel = f\"./id2rel.json\"\n",
    "out_file_rel2id = f\"./rel2id.json\"\n",
    "\n",
    "with open(out_file_id2ent, 'w') as file:\n",
    "    json.dump(cpd_id2ent, file, indent=6)\n",
    "with open(out_file_ent2id, 'w') as file:\n",
    "    json.dump(cpd_ent2id, file, indent=6)\n",
    "with open(out_file_id2rel, 'w') as file:\n",
    "    json.dump(cpd_id2rel, file, indent=6)\n",
    "with open(out_file_rel2id, 'w') as file:\n",
    "    json.dump(cpd_rel2id, file, indent=6)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import pickle\n",
    "\n",
    "with open('../../../graphs/condition/CCSCM/entity_embedding.pkl', 'rb') as f:\n",
    "    cond_ent_emb = pickle.load(f)\n",
    "\n",
    "with open('../../../graphs/condition/CCSCM/relation_embedding.pkl', 'rb') as f:\n",
    "    cond_rel_emb = pickle.load(f)\n",
    "\n",
    "with open('../../../graphs/procedure/CCSPROC/entity_embedding.pkl', 'rb') as f:\n",
    "    proc_ent_emb = pickle.load(f)\n",
    "\n",
    "with open('../../../graphs/procedure/CCSPROC/relation_embedding.pkl', 'rb') as f:\n",
    "    proc_rel_emb = pickle.load(f)\n",
    "\n",
    "with open('../../../graphs/drug/ATC3/entity_embedding.pkl', 'rb') as f:\n",
    "    drug_ent_emb = pickle.load(f)\n",
    "\n",
    "with open('../../../graphs/drug/ATC3/relation_embedding.pkl', 'rb') as f:\n",
    "    drug_rel_emb = pickle.load(f)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "((10845, 1536), (8502, 1536), (22709, 1536))"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "cond_ent_emb.shape, proc_ent_emb.shape, drug_ent_emb.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "# cp_ent_emb = np.concatenate((cond_ent_emb, proc_ent_emb), axis=0)\n",
    "# cpd_ent_emb = np.concatenate((cp_ent_emb, drug_ent_emb), axis=0)\n",
    "\n",
    "cp_rel_emb = np.concatenate((cond_rel_emb, proc_rel_emb), axis=0)\n",
    "cpd_rel_emb = np.concatenate((cp_rel_emb, drug_rel_emb), axis=0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "((19347, 1536), (42056, 1536))"
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "cp_ent_emb.shape, cpd_ent_emb.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [],
   "source": [
    "ent_emb_pkl = \"./entity_embedding.pkl\"\n",
    "rel_emb_pkl = \"./relation_embedding.pkl\"\n",
    "\n",
    "# with open(ent_emb_pkl, \"wb\") as file:\n",
    "#     pickle.dump(cpd_ent_emb, file)\n",
    "\n",
    "with open(rel_emb_pkl, \"wb\") as file:\n",
    "    pickle.dump(cpd_rel_emb, file)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3.8.13 ('kgc')",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.13"
  },
  "orig_nbformat": 4,
  "vscode": {
   "interpreter": {
    "hash": "3d0509d9aa81f2882b18eeb72d4d23c32cae9029e9b99f63cde94ba86c35ac78"
   }
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
