{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "f8c3e0a4",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "/data1/anonymous/codes/anonymous\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "os.chdir(\"../\")\n",
    "print(os.getcwd())"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "e593908a",
   "metadata": {},
   "source": [
    "First fix the key in one json file:\n",
    "```bash\n",
    "python scripts/fix_key_in_chest_ct_scan.py\n",
    "```"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "id": "70f7dcd7",
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "from pathlib import Path\n",
    "from pprint import pformat\n",
    "from collections import Counter, defaultdict\n",
    "import numpy as np\n",
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "28c03c11",
   "metadata": {},
   "outputs": [],
   "source": [
    "vqa_json_dir = Path(\"data/OmniMedVQA/QA_information/Open-access\")\n",
    "# vqa_json_dir = Path(\"data/OmniMedVQA/QA_information/Restricted-access\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "91edb4a1",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Number of VQA JSON files: 42\n"
     ]
    }
   ],
   "source": [
    "vqa_json_list = list(vqa_json_dir.glob(\"*.json\"))\n",
    "print(f\"Number of VQA JSON files: {len(vqa_json_list)}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "16b8bdf4",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Example VQA JSON file: data/OmniMedVQA/QA_information/Open-access/Chest CT Scan.json\n",
      "Number of samples: 871\n",
      "One sample: {'dataset': 'Chest CT Scan',\n",
      " 'gt_answer': 'CT',\n",
      " 'image_path': 'Images/Chest CT '\n",
      "               'Scan/test/adenocarcinoma_left.lower.lobe_T2_N0_M0_Ib/000143 '\n",
      "               '(6).png',\n",
      " 'modality_type': 'CT(Computed Tomography)',\n",
      " 'option_A': 'Angiography',\n",
      " 'option_B': 'Electrocardiogram (ECG)',\n",
      " 'option_C': 'Mammogram',\n",
      " 'option_D': 'CT',\n",
      " 'question': 'What imaging technique was employed for capturing this image?',\n",
      " 'question_id': 'Chest CT Scan_0000',\n",
      " 'question_type': 'Modality Recognition'}\n"
     ]
    }
   ],
   "source": [
    "one_vqa_json = vqa_json_list[0]\n",
    "print(f\"Example VQA JSON file: {one_vqa_json}\")\n",
    "\n",
    "with open(one_vqa_json, \"r\") as f:\n",
    "    data = json.load(f)\n",
    "print(f\"Number of samples: {len(data)}\")\n",
    "print(f\"One sample: {pformat(data[0])}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "7270db40",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Validated JSON file 1/42: data/OmniMedVQA/QA_information/Open-access/Chest CT Scan.json\n",
      "Validated JSON file 2/42: data/OmniMedVQA/QA_information/Open-access/SARS-CoV-2 CT-scan.json\n",
      "Validated JSON file 3/42: data/OmniMedVQA/QA_information/Open-access/ISIC2019.json\n",
      "Validated JSON file 4/42: data/OmniMedVQA/QA_information/Open-access/Adam Challenge.json\n",
      "Validated JSON file 5/42: data/OmniMedVQA/QA_information/Open-access/OLIVES.json\n",
      "Validated JSON file 6/42: data/OmniMedVQA/QA_information/Open-access/Mura.json\n",
      "Validated JSON file 7/42: data/OmniMedVQA/QA_information/Open-access/ISBI2016.json\n",
      "Validated JSON file 8/42: data/OmniMedVQA/QA_information/Open-access/Retinal OCT-C8.json\n",
      "Validated JSON file 9/42: data/OmniMedVQA/QA_information/Open-access/ISIC2018.json\n",
      "Validated JSON file 10/42: data/OmniMedVQA/QA_information/Open-access/Fitzpatrick 17k.json\n",
      "Validated JSON file 11/42: data/OmniMedVQA/QA_information/Open-access/DeepDRiD.json\n",
      "Validated JSON file 12/42: data/OmniMedVQA/QA_information/Open-access/BreakHis.json\n",
      "Validated JSON file 13/42: data/OmniMedVQA/QA_information/Open-access/MAlig Lymph.json\n",
      "Validated JSON file 14/42: data/OmniMedVQA/QA_information/Open-access/Knee Osteoarthritis.json\n",
      "Validated JSON file 15/42: data/OmniMedVQA/QA_information/Open-access/PALM2019.json\n",
      "Validated JSON file 16/42: data/OmniMedVQA/QA_information/Open-access/HuSHeM.json\n",
      "Validated JSON file 17/42: data/OmniMedVQA/QA_information/Open-access/Pulmonary Chest MC.json\n",
      "Validated JSON file 18/42: data/OmniMedVQA/QA_information/Open-access/ACRIMA.json\n",
      "Validated JSON file 19/42: data/OmniMedVQA/QA_information/Open-access/Chest X-Ray PA.json\n",
      "Validated JSON file 20/42: data/OmniMedVQA/QA_information/Open-access/COVIDx CXR-4.json\n",
      "Validated JSON file 21/42: data/OmniMedVQA/QA_information/Open-access/DRIMDB.json\n",
      "Validated JSON file 22/42: data/OmniMedVQA/QA_information/Open-access/Covid-19 tianchi.json\n",
      "Validated JSON file 23/42: data/OmniMedVQA/QA_information/Open-access/RadImageNet.json\n",
      "Validated JSON file 24/42: data/OmniMedVQA/QA_information/Open-access/RUS CHN.json\n",
      "Validated JSON file 25/42: data/OmniMedVQA/QA_information/Open-access/Covid19 heywhale.json\n",
      "Validated JSON file 26/42: data/OmniMedVQA/QA_information/Open-access/JSIEC.json\n",
      "Validated JSON file 27/42: data/OmniMedVQA/QA_information/Open-access/BioMediTech.json\n",
      "Validated JSON file 28/42: data/OmniMedVQA/QA_information/Open-access/NLM- Malaria Data.json\n",
      "Validated JSON file 29/42: data/OmniMedVQA/QA_information/Open-access/Diabetic Retinopathy.json\n",
      "Validated JSON file 30/42: data/OmniMedVQA/QA_information/Open-access/CoronaHack.json\n",
      "Validated JSON file 31/42: data/OmniMedVQA/QA_information/Open-access/Blood Cell.json\n",
      "Validated JSON file 32/42: data/OmniMedVQA/QA_information/Open-access/ISIC2020.json\n",
      "Validated JSON file 33/42: data/OmniMedVQA/QA_information/Open-access/Yangxi.json\n",
      "Validated JSON file 34/42: data/OmniMedVQA/QA_information/Open-access/MIAS.json\n",
      "Validated JSON file 35/42: data/OmniMedVQA/QA_information/Open-access/MHSMA.json\n",
      "Validated JSON file 36/42: data/OmniMedVQA/QA_information/Open-access/OCT & X-Ray 2017.json\n",
      "Validated JSON file 37/42: data/OmniMedVQA/QA_information/Open-access/ALL Challenge.json\n",
      "Validated JSON file 38/42: data/OmniMedVQA/QA_information/Open-access/Pulmonary Chest Shenzhen.json\n",
      "Validated JSON file 39/42: data/OmniMedVQA/QA_information/Open-access/PAD-UFES-20.json\n",
      "Validated JSON file 40/42: data/OmniMedVQA/QA_information/Open-access/Monkeypox Skin Image 2022.json\n",
      "Validated JSON file 41/42: data/OmniMedVQA/QA_information/Open-access/Covid CT.json\n",
      "Validated JSON file 42/42: data/OmniMedVQA/QA_information/Open-access/CRC100k.json\n"
     ]
    }
   ],
   "source": [
    "# validate if all json are list of dictionaries\n",
    "# validate all items have the same keys\n",
    "template_keys = None\n",
    "for i, vqa_json in enumerate(vqa_json_list):\n",
    "    with open(vqa_json, \"r\") as f:\n",
    "        data = json.load(f)\n",
    "        if not isinstance(data, list):\n",
    "            raise ValueError(f\"JSON file {vqa_json} is not a list.\")\n",
    "        if not all(isinstance(item, dict) for item in data):\n",
    "            raise ValueError(f\"JSON file {vqa_json} does not contain all dictionaries.\")\n",
    "\n",
    "        if template_keys is None:\n",
    "            template_keys = set(data[0].keys())\n",
    "        keys = set(data[0].keys())\n",
    "        if keys != template_keys:\n",
    "            mismatched_keys = keys - template_keys\n",
    "            missing_keys = template_keys - keys\n",
    "            raise ValueError(f\"JSON file {vqa_json} has mismatched keys: {mismatched_keys} or missing keys: {missing_keys}\")\n",
    "        # print(f\"{vqa_json.stem}:\\t{sorted(keys)}\")\n",
    "\n",
    "    print(f\"Validated JSON file {i+1}/{len(vqa_json_list)}: {vqa_json}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "id": "ff9d1c2c",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "All modality types (8):\n",
      "['CT(Computed Tomography)',\n",
      " 'Dermoscopy',\n",
      " 'Fundus Photography',\n",
      " 'MR (Mag-netic Resonance Imaging)',\n",
      " 'Microscopy Images',\n",
      " 'OCT (Optical Coherence Tomography',\n",
      " 'X-Ray',\n",
      " 'ultrasound']\n",
      "All question types (5):\n",
      "['Anatomy Identification',\n",
      " 'Disease Diagnosis',\n",
      " 'Lesion Grading',\n",
      " 'Modality Recognition',\n",
      " 'Other Biological Attributes']\n"
     ]
    }
   ],
   "source": [
    "all_modality_types = set()\n",
    "all_question_types = set()\n",
    "for i, vqa_json in enumerate(vqa_json_list):\n",
    "    with open(vqa_json, \"r\") as f:\n",
    "        data = json.load(f)\n",
    "        for item in data:\n",
    "            all_modality_types.add(item[\"modality_type\"])\n",
    "            all_question_types.add(item[\"question_type\"])\n",
    "print(f\"All modality types ({len(all_modality_types)}):\\n{pformat(sorted(all_modality_types))}\")\n",
    "print(f\"All question types ({len(all_question_types)}):\\n{pformat(sorted(all_question_types))}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "id": "457838dd",
   "metadata": {},
   "outputs": [],
   "source": [
    "def stat_types(data, all_modality_types, all_question_types):\n",
    "    modality_type_count = {k: 0 for k in all_modality_types}\n",
    "    question_type_count = {k: 0 for k in all_question_types}\n",
    "    for sample in data:\n",
    "        modality_type_count[sample[\"modality_type\"]] += 1\n",
    "        question_type_count[sample[\"question_type\"]] += 1\n",
    "    return modality_type_count, question_type_count\n",
    "\n",
    "def gather_stat_types(vqa_json_list, all_modality_types, all_question_types):\n",
    "    vqa_json_stats = defaultdict(dict)\n",
    "    for i, vqa_json in enumerate(vqa_json_list):\n",
    "        with open(vqa_json, \"r\") as f:\n",
    "            data = json.load(f)\n",
    "            modality_type_count, question_type_count = stat_types(data, all_modality_types, all_question_types)\n",
    "            vqa_json_stats[vqa_json.stem][\"modality_type_count\"] = modality_type_count\n",
    "            vqa_json_stats[vqa_json.stem][\"question_type_count\"] = question_type_count\n",
    "    return vqa_json_stats\n",
    "vqa_json_stats = gather_stat_types(vqa_json_list, all_modality_types, all_question_types)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "id": "a151b4e5",
   "metadata": {},
   "outputs": [],
   "source": [
    "modality_type_df = pd.DataFrame.from_dict(\n",
    "    {k: v[\"modality_type_count\"] for k, v in vqa_json_stats.items()},\n",
    "    orient=\"index\",\n",
    ")\n",
    "question_type_df = pd.DataFrame.from_dict(\n",
    "    {k: v[\"question_type_count\"] for k, v in vqa_json_stats.items()},\n",
    "    orient=\"index\",\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "id": "82d770dc",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>OCT (Optical Coherence Tomography</th>\n",
       "      <th>Fundus Photography</th>\n",
       "      <th>MR (Mag-netic Resonance Imaging)</th>\n",
       "      <th>CT(Computed Tomography)</th>\n",
       "      <th>Microscopy Images</th>\n",
       "      <th>ultrasound</th>\n",
       "      <th>X-Ray</th>\n",
       "      <th>Dermoscopy</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>Chest CT Scan</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>871</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>SARS-CoV-2 CT-scan</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>910</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ISIC2019</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1952</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Adam Challenge</th>\n",
       "      <td>0</td>\n",
       "      <td>87</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>OLIVES</th>\n",
       "      <td>0</td>\n",
       "      <td>593</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Mura</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1464</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ISBI2016</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>681</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Retinal OCT-C8</th>\n",
       "      <td>4016</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ISIC2018</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>272</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Fitzpatrick 17k</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1552</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>DeepDRiD</th>\n",
       "      <td>0</td>\n",
       "      <td>131</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BreakHis</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>735</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>MAlig Lymph</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>149</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Knee Osteoarthritis</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>518</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>PALM2019</th>\n",
       "      <td>0</td>\n",
       "      <td>510</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>HuSHeM</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>89</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Pulmonary Chest MC</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>38</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ACRIMA</th>\n",
       "      <td>0</td>\n",
       "      <td>159</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Chest X-Ray PA</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>850</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>COVIDx CXR-4</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>485</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>DRIMDB</th>\n",
       "      <td>0</td>\n",
       "      <td>132</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Covid-19 tianchi</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>96</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>RadImageNet</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>31877</td>\n",
       "      <td>13829</td>\n",
       "      <td>0</td>\n",
       "      <td>10991</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>RUS CHN</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1982</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Covid19 heywhale</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>690</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>JSIEC</th>\n",
       "      <td>0</td>\n",
       "      <td>220</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BioMediTech</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>511</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>NLM- Malaria Data</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>75</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Diabetic Retinopathy</th>\n",
       "      <td>0</td>\n",
       "      <td>2051</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoronaHack</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>684</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Blood Cell</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1175</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ISIC2020</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1580</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Yangxi</th>\n",
       "      <td>0</td>\n",
       "      <td>1515</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>MIAS</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>142</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>MHSMA</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1282</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>OCT &amp; X-Ray 2017</th>\n",
       "      <td>630</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>671</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ALL Challenge</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>342</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Pulmonary Chest Shenzhen</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>296</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>PAD-UFES-20</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>479</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Monkeypox Skin Image 2022</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>163</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Covid CT</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>199</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CRC100k</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1322</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                           OCT (Optical Coherence Tomography  \\\n",
       "Chest CT Scan                                              0   \n",
       "SARS-CoV-2 CT-scan                                         0   \n",
       "ISIC2019                                                   0   \n",
       "Adam Challenge                                             0   \n",
       "OLIVES                                                     0   \n",
       "Mura                                                       0   \n",
       "ISBI2016                                                   0   \n",
       "Retinal OCT-C8                                          4016   \n",
       "ISIC2018                                                   0   \n",
       "Fitzpatrick 17k                                            0   \n",
       "DeepDRiD                                                   0   \n",
       "BreakHis                                                   0   \n",
       "MAlig Lymph                                                0   \n",
       "Knee Osteoarthritis                                        0   \n",
       "PALM2019                                                   0   \n",
       "HuSHeM                                                     0   \n",
       "Pulmonary Chest MC                                         0   \n",
       "ACRIMA                                                     0   \n",
       "Chest X-Ray PA                                             0   \n",
       "COVIDx CXR-4                                               0   \n",
       "DRIMDB                                                     0   \n",
       "Covid-19 tianchi                                           0   \n",
       "RadImageNet                                                0   \n",
       "RUS CHN                                                    0   \n",
       "Covid19 heywhale                                           0   \n",
       "JSIEC                                                      0   \n",
       "BioMediTech                                                0   \n",
       "NLM- Malaria Data                                          0   \n",
       "Diabetic Retinopathy                                       0   \n",
       "CoronaHack                                                 0   \n",
       "Blood Cell                                                 0   \n",
       "ISIC2020                                                   0   \n",
       "Yangxi                                                     0   \n",
       "MIAS                                                       0   \n",
       "MHSMA                                                      0   \n",
       "OCT & X-Ray 2017                                         630   \n",
       "ALL Challenge                                              0   \n",
       "Pulmonary Chest Shenzhen                                   0   \n",
       "PAD-UFES-20                                                0   \n",
       "Monkeypox Skin Image 2022                                  0   \n",
       "Covid CT                                                   0   \n",
       "CRC100k                                                    0   \n",
       "\n",
       "                           Fundus Photography  \\\n",
       "Chest CT Scan                               0   \n",
       "SARS-CoV-2 CT-scan                          0   \n",
       "ISIC2019                                    0   \n",
       "Adam Challenge                             87   \n",
       "OLIVES                                    593   \n",
       "Mura                                        0   \n",
       "ISBI2016                                    0   \n",
       "Retinal OCT-C8                              0   \n",
       "ISIC2018                                    0   \n",
       "Fitzpatrick 17k                             0   \n",
       "DeepDRiD                                  131   \n",
       "BreakHis                                    0   \n",
       "MAlig Lymph                                 0   \n",
       "Knee Osteoarthritis                         0   \n",
       "PALM2019                                  510   \n",
       "HuSHeM                                      0   \n",
       "Pulmonary Chest MC                          0   \n",
       "ACRIMA                                    159   \n",
       "Chest X-Ray PA                              0   \n",
       "COVIDx CXR-4                                0   \n",
       "DRIMDB                                    132   \n",
       "Covid-19 tianchi                            0   \n",
       "RadImageNet                                 0   \n",
       "RUS CHN                                     0   \n",
       "Covid19 heywhale                            0   \n",
       "JSIEC                                     220   \n",
       "BioMediTech                                 0   \n",
       "NLM- Malaria Data                           0   \n",
       "Diabetic Retinopathy                     2051   \n",
       "CoronaHack                                  0   \n",
       "Blood Cell                                  0   \n",
       "ISIC2020                                    0   \n",
       "Yangxi                                   1515   \n",
       "MIAS                                        0   \n",
       "MHSMA                                       0   \n",
       "OCT & X-Ray 2017                            0   \n",
       "ALL Challenge                               0   \n",
       "Pulmonary Chest Shenzhen                    0   \n",
       "PAD-UFES-20                                 0   \n",
       "Monkeypox Skin Image 2022                   0   \n",
       "Covid CT                                    0   \n",
       "CRC100k                                     0   \n",
       "\n",
       "                           MR (Mag-netic Resonance Imaging)  \\\n",
       "Chest CT Scan                                             0   \n",
       "SARS-CoV-2 CT-scan                                        0   \n",
       "ISIC2019                                                  0   \n",
       "Adam Challenge                                            0   \n",
       "OLIVES                                                    0   \n",
       "Mura                                                      0   \n",
       "ISBI2016                                                  0   \n",
       "Retinal OCT-C8                                            0   \n",
       "ISIC2018                                                  0   \n",
       "Fitzpatrick 17k                                           0   \n",
       "DeepDRiD                                                  0   \n",
       "BreakHis                                                  0   \n",
       "MAlig Lymph                                               0   \n",
       "Knee Osteoarthritis                                       0   \n",
       "PALM2019                                                  0   \n",
       "HuSHeM                                                    0   \n",
       "Pulmonary Chest MC                                        0   \n",
       "ACRIMA                                                    0   \n",
       "Chest X-Ray PA                                            0   \n",
       "COVIDx CXR-4                                              0   \n",
       "DRIMDB                                                    0   \n",
       "Covid-19 tianchi                                          0   \n",
       "RadImageNet                                           31877   \n",
       "RUS CHN                                                   0   \n",
       "Covid19 heywhale                                          0   \n",
       "JSIEC                                                     0   \n",
       "BioMediTech                                               0   \n",
       "NLM- Malaria Data                                         0   \n",
       "Diabetic Retinopathy                                      0   \n",
       "CoronaHack                                                0   \n",
       "Blood Cell                                                0   \n",
       "ISIC2020                                                  0   \n",
       "Yangxi                                                    0   \n",
       "MIAS                                                      0   \n",
       "MHSMA                                                     0   \n",
       "OCT & X-Ray 2017                                          0   \n",
       "ALL Challenge                                             0   \n",
       "Pulmonary Chest Shenzhen                                  0   \n",
       "PAD-UFES-20                                               0   \n",
       "Monkeypox Skin Image 2022                                 0   \n",
       "Covid CT                                                  0   \n",
       "CRC100k                                                   0   \n",
       "\n",
       "                           CT(Computed Tomography)  Microscopy Images  \\\n",
       "Chest CT Scan                                  871                  0   \n",
       "SARS-CoV-2 CT-scan                             910                  0   \n",
       "ISIC2019                                         0                  0   \n",
       "Adam Challenge                                   0                  0   \n",
       "OLIVES                                           0                  0   \n",
       "Mura                                             0                  0   \n",
       "ISBI2016                                         0                  0   \n",
       "Retinal OCT-C8                                   0                  0   \n",
       "ISIC2018                                         0                  0   \n",
       "Fitzpatrick 17k                                  0                  0   \n",
       "DeepDRiD                                         0                  0   \n",
       "BreakHis                                         0                735   \n",
       "MAlig Lymph                                      0                149   \n",
       "Knee Osteoarthritis                              0                  0   \n",
       "PALM2019                                         0                  0   \n",
       "HuSHeM                                           0                 89   \n",
       "Pulmonary Chest MC                               0                  0   \n",
       "ACRIMA                                           0                  0   \n",
       "Chest X-Ray PA                                   0                  0   \n",
       "COVIDx CXR-4                                     0                  0   \n",
       "DRIMDB                                           0                  0   \n",
       "Covid-19 tianchi                                 0                  0   \n",
       "RadImageNet                                  13829                  0   \n",
       "RUS CHN                                          0                  0   \n",
       "Covid19 heywhale                                 0                  0   \n",
       "JSIEC                                            0                  0   \n",
       "BioMediTech                                      0                511   \n",
       "NLM- Malaria Data                                0                 75   \n",
       "Diabetic Retinopathy                             0                  0   \n",
       "CoronaHack                                       0                  0   \n",
       "Blood Cell                                       0               1175   \n",
       "ISIC2020                                         0                  0   \n",
       "Yangxi                                           0                  0   \n",
       "MIAS                                             0                  0   \n",
       "MHSMA                                            0               1282   \n",
       "OCT & X-Ray 2017                                 0                  0   \n",
       "ALL Challenge                                    0                342   \n",
       "Pulmonary Chest Shenzhen                         0                  0   \n",
       "PAD-UFES-20                                      0                  0   \n",
       "Monkeypox Skin Image 2022                        0                  0   \n",
       "Covid CT                                       199                  0   \n",
       "CRC100k                                          0               1322   \n",
       "\n",
       "                           ultrasound  X-Ray  Dermoscopy  \n",
       "Chest CT Scan                       0      0           0  \n",
       "SARS-CoV-2 CT-scan                  0      0           0  \n",
       "ISIC2019                            0      0        1952  \n",
       "Adam Challenge                      0      0           0  \n",
       "OLIVES                              0      0           0  \n",
       "Mura                                0   1464           0  \n",
       "ISBI2016                            0      0         681  \n",
       "Retinal OCT-C8                      0      0           0  \n",
       "ISIC2018                            0      0         272  \n",
       "Fitzpatrick 17k                     0      0        1552  \n",
       "DeepDRiD                            0      0           0  \n",
       "BreakHis                            0      0           0  \n",
       "MAlig Lymph                         0      0           0  \n",
       "Knee Osteoarthritis                 0    518           0  \n",
       "PALM2019                            0      0           0  \n",
       "HuSHeM                              0      0           0  \n",
       "Pulmonary Chest MC                  0     38           0  \n",
       "ACRIMA                              0      0           0  \n",
       "Chest X-Ray PA                      0    850           0  \n",
       "COVIDx CXR-4                        0    485           0  \n",
       "DRIMDB                              0      0           0  \n",
       "Covid-19 tianchi                    0     96           0  \n",
       "RadImageNet                     10991      0           0  \n",
       "RUS CHN                             0   1982           0  \n",
       "Covid19 heywhale                    0    690           0  \n",
       "JSIEC                               0      0           0  \n",
       "BioMediTech                         0      0           0  \n",
       "NLM- Malaria Data                   0      0           0  \n",
       "Diabetic Retinopathy                0      0           0  \n",
       "CoronaHack                          0    684           0  \n",
       "Blood Cell                          0      0           0  \n",
       "ISIC2020                            0      0        1580  \n",
       "Yangxi                              0      0           0  \n",
       "MIAS                                0    142           0  \n",
       "MHSMA                               0      0           0  \n",
       "OCT & X-Ray 2017                    0    671           0  \n",
       "ALL Challenge                       0      0           0  \n",
       "Pulmonary Chest Shenzhen            0    296           0  \n",
       "PAD-UFES-20                         0      0         479  \n",
       "Monkeypox Skin Image 2022           0      0         163  \n",
       "Covid CT                            0      0           0  \n",
       "CRC100k                             0      0           0  "
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Modality Recognition</th>\n",
       "      <th>Other Biological Attributes</th>\n",
       "      <th>Anatomy Identification</th>\n",
       "      <th>Lesion Grading</th>\n",
       "      <th>Disease Diagnosis</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>Chest CT Scan</th>\n",
       "      <td>10</td>\n",
       "      <td>268</td>\n",
       "      <td>0</td>\n",
       "      <td>268</td>\n",
       "      <td>325</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>SARS-CoV-2 CT-scan</th>\n",
       "      <td>15</td>\n",
       "      <td>0</td>\n",
       "      <td>298</td>\n",
       "      <td>0</td>\n",
       "      <td>597</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ISIC2019</th>\n",
       "      <td>315</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1637</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Adam Challenge</th>\n",
       "      <td>10</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>77</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>OLIVES</th>\n",
       "      <td>154</td>\n",
       "      <td>0</td>\n",
       "      <td>439</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Mura</th>\n",
       "      <td>252</td>\n",
       "      <td>0</td>\n",
       "      <td>424</td>\n",
       "      <td>0</td>\n",
       "      <td>788</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ISBI2016</th>\n",
       "      <td>69</td>\n",
       "      <td>0</td>\n",
       "      <td>136</td>\n",
       "      <td>0</td>\n",
       "      <td>476</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Retinal OCT-C8</th>\n",
       "      <td>349</td>\n",
       "      <td>1697</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1970</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ISIC2018</th>\n",
       "      <td>15</td>\n",
       "      <td>0</td>\n",
       "      <td>84</td>\n",
       "      <td>0</td>\n",
       "      <td>173</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Fitzpatrick 17k</th>\n",
       "      <td>265</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1287</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>DeepDRiD</th>\n",
       "      <td>131</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BreakHis</th>\n",
       "      <td>181</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>554</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>MAlig Lymph</th>\n",
       "      <td>14</td>\n",
       "      <td>0</td>\n",
       "      <td>60</td>\n",
       "      <td>0</td>\n",
       "      <td>75</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Knee Osteoarthritis</th>\n",
       "      <td>518</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>PALM2019</th>\n",
       "      <td>117</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>393</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>HuSHeM</th>\n",
       "      <td>7</td>\n",
       "      <td>41</td>\n",
       "      <td>41</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Pulmonary Chest MC</th>\n",
       "      <td>4</td>\n",
       "      <td>0</td>\n",
       "      <td>6</td>\n",
       "      <td>0</td>\n",
       "      <td>28</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ACRIMA</th>\n",
       "      <td>34</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>125</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Chest X-Ray PA</th>\n",
       "      <td>63</td>\n",
       "      <td>0</td>\n",
       "      <td>252</td>\n",
       "      <td>0</td>\n",
       "      <td>535</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>COVIDx CXR-4</th>\n",
       "      <td>75</td>\n",
       "      <td>0</td>\n",
       "      <td>116</td>\n",
       "      <td>0</td>\n",
       "      <td>294</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>DRIMDB</th>\n",
       "      <td>10</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>122</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Covid-19 tianchi</th>\n",
       "      <td>10</td>\n",
       "      <td>0</td>\n",
       "      <td>20</td>\n",
       "      <td>0</td>\n",
       "      <td>66</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>RadImageNet</th>\n",
       "      <td>6306</td>\n",
       "      <td>17</td>\n",
       "      <td>10018</td>\n",
       "      <td>0</td>\n",
       "      <td>40356</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>RUS CHN</th>\n",
       "      <td>340</td>\n",
       "      <td>0</td>\n",
       "      <td>1642</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Covid19 heywhale</th>\n",
       "      <td>41</td>\n",
       "      <td>0</td>\n",
       "      <td>177</td>\n",
       "      <td>0</td>\n",
       "      <td>472</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>JSIEC</th>\n",
       "      <td>46</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>174</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BioMediTech</th>\n",
       "      <td>71</td>\n",
       "      <td>305</td>\n",
       "      <td>135</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>NLM- Malaria Data</th>\n",
       "      <td>8</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>67</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Diabetic Retinopathy</th>\n",
       "      <td>343</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1708</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoronaHack</th>\n",
       "      <td>101</td>\n",
       "      <td>0</td>\n",
       "      <td>251</td>\n",
       "      <td>0</td>\n",
       "      <td>332</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Blood Cell</th>\n",
       "      <td>229</td>\n",
       "      <td>0</td>\n",
       "      <td>946</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ISIC2020</th>\n",
       "      <td>368</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1212</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Yangxi</th>\n",
       "      <td>345</td>\n",
       "      <td>1170</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>MIAS</th>\n",
       "      <td>14</td>\n",
       "      <td>0</td>\n",
       "      <td>63</td>\n",
       "      <td>0</td>\n",
       "      <td>65</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>MHSMA</th>\n",
       "      <td>157</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1125</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>OCT &amp; X-Ray 2017</th>\n",
       "      <td>178</td>\n",
       "      <td>0</td>\n",
       "      <td>263</td>\n",
       "      <td>0</td>\n",
       "      <td>860</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ALL Challenge</th>\n",
       "      <td>69</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>273</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Pulmonary Chest Shenzhen</th>\n",
       "      <td>8</td>\n",
       "      <td>0</td>\n",
       "      <td>161</td>\n",
       "      <td>0</td>\n",
       "      <td>127</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>PAD-UFES-20</th>\n",
       "      <td>92</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>387</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Monkeypox Skin Image 2022</th>\n",
       "      <td>9</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>154</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Covid CT</th>\n",
       "      <td>28</td>\n",
       "      <td>0</td>\n",
       "      <td>62</td>\n",
       "      <td>0</td>\n",
       "      <td>109</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CRC100k</th>\n",
       "      <td>194</td>\n",
       "      <td>0</td>\n",
       "      <td>854</td>\n",
       "      <td>0</td>\n",
       "      <td>274</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                           Modality Recognition  Other Biological Attributes  \\\n",
       "Chest CT Scan                                10                          268   \n",
       "SARS-CoV-2 CT-scan                           15                            0   \n",
       "ISIC2019                                    315                            0   \n",
       "Adam Challenge                               10                            0   \n",
       "OLIVES                                      154                            0   \n",
       "Mura                                        252                            0   \n",
       "ISBI2016                                     69                            0   \n",
       "Retinal OCT-C8                              349                         1697   \n",
       "ISIC2018                                     15                            0   \n",
       "Fitzpatrick 17k                             265                            0   \n",
       "DeepDRiD                                    131                            0   \n",
       "BreakHis                                    181                            0   \n",
       "MAlig Lymph                                  14                            0   \n",
       "Knee Osteoarthritis                         518                            0   \n",
       "PALM2019                                    117                            0   \n",
       "HuSHeM                                        7                           41   \n",
       "Pulmonary Chest MC                            4                            0   \n",
       "ACRIMA                                       34                            0   \n",
       "Chest X-Ray PA                               63                            0   \n",
       "COVIDx CXR-4                                 75                            0   \n",
       "DRIMDB                                       10                            0   \n",
       "Covid-19 tianchi                             10                            0   \n",
       "RadImageNet                                6306                           17   \n",
       "RUS CHN                                     340                            0   \n",
       "Covid19 heywhale                             41                            0   \n",
       "JSIEC                                        46                            0   \n",
       "BioMediTech                                  71                          305   \n",
       "NLM- Malaria Data                             8                            0   \n",
       "Diabetic Retinopathy                        343                            0   \n",
       "CoronaHack                                  101                            0   \n",
       "Blood Cell                                  229                            0   \n",
       "ISIC2020                                    368                            0   \n",
       "Yangxi                                      345                         1170   \n",
       "MIAS                                         14                            0   \n",
       "MHSMA                                       157                            0   \n",
       "OCT & X-Ray 2017                            178                            0   \n",
       "ALL Challenge                                69                            0   \n",
       "Pulmonary Chest Shenzhen                      8                            0   \n",
       "PAD-UFES-20                                  92                            0   \n",
       "Monkeypox Skin Image 2022                     9                            0   \n",
       "Covid CT                                     28                            0   \n",
       "CRC100k                                     194                            0   \n",
       "\n",
       "                           Anatomy Identification  Lesion Grading  \\\n",
       "Chest CT Scan                                   0             268   \n",
       "SARS-CoV-2 CT-scan                            298               0   \n",
       "ISIC2019                                        0               0   \n",
       "Adam Challenge                                  0               0   \n",
       "OLIVES                                        439               0   \n",
       "Mura                                          424               0   \n",
       "ISBI2016                                      136               0   \n",
       "Retinal OCT-C8                                  0               0   \n",
       "ISIC2018                                       84               0   \n",
       "Fitzpatrick 17k                                 0               0   \n",
       "DeepDRiD                                        0               0   \n",
       "BreakHis                                        0               0   \n",
       "MAlig Lymph                                    60               0   \n",
       "Knee Osteoarthritis                             0               0   \n",
       "PALM2019                                        0               0   \n",
       "HuSHeM                                         41               0   \n",
       "Pulmonary Chest MC                              6               0   \n",
       "ACRIMA                                          0               0   \n",
       "Chest X-Ray PA                                252               0   \n",
       "COVIDx CXR-4                                  116               0   \n",
       "DRIMDB                                          0             122   \n",
       "Covid-19 tianchi                               20               0   \n",
       "RadImageNet                                 10018               0   \n",
       "RUS CHN                                      1642               0   \n",
       "Covid19 heywhale                              177               0   \n",
       "JSIEC                                           0               0   \n",
       "BioMediTech                                   135               0   \n",
       "NLM- Malaria Data                               0               0   \n",
       "Diabetic Retinopathy                            0            1708   \n",
       "CoronaHack                                    251               0   \n",
       "Blood Cell                                    946               0   \n",
       "ISIC2020                                        0               0   \n",
       "Yangxi                                          0               0   \n",
       "MIAS                                           63               0   \n",
       "MHSMA                                           0               0   \n",
       "OCT & X-Ray 2017                              263               0   \n",
       "ALL Challenge                                   0               0   \n",
       "Pulmonary Chest Shenzhen                      161               0   \n",
       "PAD-UFES-20                                     0               0   \n",
       "Monkeypox Skin Image 2022                       0               0   \n",
       "Covid CT                                       62               0   \n",
       "CRC100k                                       854               0   \n",
       "\n",
       "                           Disease Diagnosis  \n",
       "Chest CT Scan                            325  \n",
       "SARS-CoV-2 CT-scan                       597  \n",
       "ISIC2019                                1637  \n",
       "Adam Challenge                            77  \n",
       "OLIVES                                     0  \n",
       "Mura                                     788  \n",
       "ISBI2016                                 476  \n",
       "Retinal OCT-C8                          1970  \n",
       "ISIC2018                                 173  \n",
       "Fitzpatrick 17k                         1287  \n",
       "DeepDRiD                                   0  \n",
       "BreakHis                                 554  \n",
       "MAlig Lymph                               75  \n",
       "Knee Osteoarthritis                        0  \n",
       "PALM2019                                 393  \n",
       "HuSHeM                                     0  \n",
       "Pulmonary Chest MC                        28  \n",
       "ACRIMA                                   125  \n",
       "Chest X-Ray PA                           535  \n",
       "COVIDx CXR-4                             294  \n",
       "DRIMDB                                     0  \n",
       "Covid-19 tianchi                          66  \n",
       "RadImageNet                            40356  \n",
       "RUS CHN                                    0  \n",
       "Covid19 heywhale                         472  \n",
       "JSIEC                                    174  \n",
       "BioMediTech                                0  \n",
       "NLM- Malaria Data                         67  \n",
       "Diabetic Retinopathy                       0  \n",
       "CoronaHack                               332  \n",
       "Blood Cell                                 0  \n",
       "ISIC2020                                1212  \n",
       "Yangxi                                     0  \n",
       "MIAS                                      65  \n",
       "MHSMA                                   1125  \n",
       "OCT & X-Ray 2017                         860  \n",
       "ALL Challenge                            273  \n",
       "Pulmonary Chest Shenzhen                 127  \n",
       "PAD-UFES-20                              387  \n",
       "Monkeypox Skin Image 2022                154  \n",
       "Covid CT                                 109  \n",
       "CRC100k                                  274  "
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "display(modality_type_df)\n",
    "display(question_type_df)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "m1",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.16"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
