{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "537f929c-b3eb-4abf-a378-35c600fb1dd2",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\u001B[43mNote: you may need to restart the kernel using %restart_python or dbutils.library.restartPython() to use updated packages.\u001B[0m\n\u001B[43mNote: you may need to restart the kernel using %restart_python or dbutils.library.restartPython() to use updated packages.\u001B[0m\n\u001B[43mNote: you may need to restart the kernel using %restart_python or dbutils.library.restartPython() to use updated packages.\u001B[0m\nCollecting accelerate>=0.31.0\n  Downloading accelerate-0.33.0-py3-none-any.whl (315 kB)\n\u001B[?25l     \u001B[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m \u001B[32m0.0/315.1 kB\u001B[0m \u001B[31m?\u001B[0m eta \u001B[36m-:--:--\u001B[0m\n\u001B[2K     \u001B[91m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[90m╺\u001B[0m \u001B[32m307.2/315.1 kB\u001B[0m \u001B[31m9.8 MB/s\u001B[0m eta \u001B[36m0:00:01\u001B[0m\n\u001B[2K     \u001B[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m \u001B[32m315.1/315.1 kB\u001B[0m \u001B[31m8.0 MB/s\u001B[0m eta \u001B[36m0:00:00\u001B[0m\n\u001B[?25hCollecting huggingface-hub>=0.21.0\n  Downloading huggingface_hub-0.24.6-py3-none-any.whl (417 kB)\n\u001B[?25l     \u001B[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m \u001B[32m0.0/417.5 kB\u001B[0m \u001B[31m?\u001B[0m eta \u001B[36m-:--:--\u001B[0m\n\u001B[2K     \u001B[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m \u001B[32m417.5/417.5 kB\u001B[0m \u001B[31m15.1 MB/s\u001B[0m eta \u001B[36m0:00:00\u001B[0m\n\u001B[?25hRequirement already satisfied: numpy<2.0.0,>=1.17 in /databricks/python3/lib/python3.11/site-packages (from accelerate>=0.31.0) (1.23.5)\nRequirement already satisfied: pyyaml in /databricks/python3/lib/python3.11/site-packages (from accelerate>=0.31.0) (6.0)\nRequirement already satisfied: safetensors>=0.3.1 in /databricks/python3/lib/python3.11/site-packages (from accelerate>=0.31.0) (0.4.2)\nRequirement already satisfied: packaging>=20.0 in /databricks/python3/lib/python3.11/site-packages (from accelerate>=0.31.0) (23.2)\nRequirement already satisfied: torch>=1.10.0 in /databricks/python3/lib/python3.11/site-packages (from accelerate>=0.31.0) (2.2.2+cu121)\nRequirement already satisfied: psutil in /databricks/python3/lib/python3.11/site-packages (from accelerate>=0.31.0) (5.9.0)\nRequirement already satisfied: filelock in /databricks/python3/lib/python3.11/site-packages (from huggingface-hub>=0.21.0->accelerate>=0.31.0) (3.9.0)\nRequirement already satisfied: fsspec>=2023.5.0 in /databricks/python3/lib/python3.11/site-packages (from huggingface-hub>=0.21.0->accelerate>=0.31.0) (2023.5.0)\nRequirement already satisfied: tqdm>=4.42.1 in /databricks/python3/lib/python3.11/site-packages (from huggingface-hub>=0.21.0->accelerate>=0.31.0) (4.65.0)\nRequirement already satisfied: typing-extensions>=3.7.4.3 in /databricks/python3/lib/python3.11/site-packages (from huggingface-hub>=0.21.0->accelerate>=0.31.0) (4.10.0)\nRequirement already satisfied: requests in /databricks/python3/lib/python3.11/site-packages (from huggingface-hub>=0.21.0->accelerate>=0.31.0) (2.31.0)\nRequirement already satisfied: triton==2.2.0 in /databricks/python3/lib/python3.11/site-packages (from torch>=1.10.0->accelerate>=0.31.0) (2.2.0)\nRequirement already satisfied: nvidia-nvtx-cu12==12.1.105 in /databricks/python3/lib/python3.11/site-packages (from torch>=1.10.0->accelerate>=0.31.0) (12.1.105)\nRequirement already satisfied: nvidia-cuda-runtime-cu12==12.1.105 in /databricks/python3/lib/python3.11/site-packages (from torch>=1.10.0->accelerate>=0.31.0) (12.1.105)\nRequirement already satisfied: nvidia-cufft-cu12==11.0.2.54 in /databricks/python3/lib/python3.11/site-packages (from torch>=1.10.0->accelerate>=0.31.0) (11.0.2.54)\nRequirement already satisfied: nvidia-cudnn-cu12==8.9.2.26 in /databricks/python3/lib/python3.11/site-packages (from torch>=1.10.0->accelerate>=0.31.0) (8.9.2.26)\nRequirement already satisfied: nvidia-cuda-nvrtc-cu12==12.1.105 in /databricks/python3/lib/python3.11/site-packages (from torch>=1.10.0->accelerate>=0.31.0) (12.1.105)\nRequirement already satisfied: nvidia-curand-cu12==10.3.2.106 in /databricks/python3/lib/python3.11/site-packages (from torch>=1.10.0->accelerate>=0.31.0) (10.3.2.106)\nRequirement already satisfied: nvidia-cuda-cupti-cu12==12.1.105 in /databricks/python3/lib/python3.11/site-packages (from torch>=1.10.0->accelerate>=0.31.0) (12.1.105)\nRequirement already satisfied: nvidia-cublas-cu12==12.1.3.1 in /databricks/python3/lib/python3.11/site-packages (from torch>=1.10.0->accelerate>=0.31.0) (12.1.3.1)\nRequirement already satisfied: nvidia-nccl-cu12==2.19.3 in /databricks/python3/lib/python3.11/site-packages (from torch>=1.10.0->accelerate>=0.31.0) (2.19.3)\nRequirement already satisfied: nvidia-cusolver-cu12==11.4.5.107 in /databricks/python3/lib/python3.11/site-packages (from torch>=1.10.0->accelerate>=0.31.0) (11.4.5.107)\nRequirement already satisfied: jinja2 in /databricks/python3/lib/python3.11/site-packages (from torch>=1.10.0->accelerate>=0.31.0) (3.1.2)\nRequirement already satisfied: sympy in /databricks/python3/lib/python3.11/site-packages (from torch>=1.10.0->accelerate>=0.31.0) (1.11.1)\nRequirement already satisfied: networkx in /databricks/python3/lib/python3.11/site-packages (from torch>=1.10.0->accelerate>=0.31.0) (3.1)\nRequirement already satisfied: nvidia-cusparse-cu12==12.1.0.106 in /databricks/python3/lib/python3.11/site-packages (from torch>=1.10.0->accelerate>=0.31.0) (12.1.0.106)\nRequirement already satisfied: nvidia-nvjitlink-cu12 in /databricks/python3/lib/python3.11/site-packages (from nvidia-cusolver-cu12==11.4.5.107->torch>=1.10.0->accelerate>=0.31.0) (12.4.127)\nRequirement already satisfied: MarkupSafe>=2.0 in /databricks/python3/lib/python3.11/site-packages (from jinja2->torch>=1.10.0->accelerate>=0.31.0) (2.1.1)\nRequirement already satisfied: idna<4,>=2.5 in /databricks/python3/lib/python3.11/site-packages (from requests->huggingface-hub>=0.21.0->accelerate>=0.31.0) (3.4)\nRequirement already satisfied: certifi>=2017.4.17 in /databricks/python3/lib/python3.11/site-packages (from requests->huggingface-hub>=0.21.0->accelerate>=0.31.0) (2023.7.22)\nRequirement already satisfied: charset-normalizer<4,>=2 in /databricks/python3/lib/python3.11/site-packages (from requests->huggingface-hub>=0.21.0->accelerate>=0.31.0) (2.0.4)\nRequirement already satisfied: urllib3<3,>=1.21.1 in /databricks/python3/lib/python3.11/site-packages (from requests->huggingface-hub>=0.21.0->accelerate>=0.31.0) (1.26.16)\nRequirement already satisfied: mpmath>=0.19 in /databricks/python3/lib/python3.11/site-packages (from sympy->torch>=1.10.0->accelerate>=0.31.0) (1.3.0)\nInstalling collected packages: huggingface-hub, accelerate\n  Attempting uninstall: huggingface-hub\n    Found existing installation: huggingface-hub 0.20.2\n    Not uninstalling huggingface-hub at /databricks/python3/lib/python3.11/site-packages, outside environment /local_disk0/.ephemeral_nfs/envs/pythonEnv-25c3c754-023b-4beb-81a0-db84042570da\n    Can't uninstall 'huggingface-hub'. No files were found to uninstall.\n  Attempting uninstall: accelerate\n    Found existing installation: accelerate 0.28.0\n    Not uninstalling accelerate at /databricks/python3/lib/python3.11/site-packages, outside environment /local_disk0/.ephemeral_nfs/envs/pythonEnv-25c3c754-023b-4beb-81a0-db84042570da\n    Can't uninstall 'accelerate'. No files were found to uninstall.\nSuccessfully installed accelerate-0.33.0 huggingface-hub-0.24.6\n\u001B[43mNote: you may need to restart the kernel using %restart_python or dbutils.library.restartPython() to use updated packages.\u001B[0m\n\u001B[43mNote: you may need to restart the kernel using %restart_python or dbutils.library.restartPython() to use updated packages.\u001B[0m\nCollecting flash_attn>=2.5.8\n  Downloading flash_attn-2.6.3.tar.gz (2.6 MB)\n\u001B[?25l     \u001B[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m \u001B[32m0.0/2.6 MB\u001B[0m \u001B[31m?\u001B[0m eta \u001B[36m-:--:--\u001B[0m\n\u001B[2K     \u001B[91m━━━━━\u001B[0m\u001B[90m╺\u001B[0m\u001B[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m \u001B[32m0.4/2.6 MB\u001B[0m \u001B[31m10.8 MB/s\u001B[0m eta \u001B[36m0:00:01\u001B[0m\n\u001B[2K     \u001B[91m━━━━━━━━━━━━━━━━\u001B[0m\u001B[91m╸\u001B[0m\u001B[90m━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m \u001B[32m1.1/2.6 MB\u001B[0m \u001B[31m16.1 MB/s\u001B[0m eta \u001B[36m0:00:01\u001B[0m\n\u001B[2K     \u001B[91m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[91m╸\u001B[0m\u001B[90m━━━━━━━━━\u001B[0m \u001B[32m2.0/2.6 MB\u001B[0m \u001B[31m19.9 MB/s\u001B[0m eta \u001B[36m0:00:01\u001B[0m\n\u001B[2K     \u001B[91m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[91m╸\u001B[0m \u001B[32m2.6/2.6 MB\u001B[0m \u001B[31m21.9 MB/s\u001B[0m eta \u001B[36m0:00:01\u001B[0m\n\u001B[2K     \u001B[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m \u001B[32m2.6/2.6 MB\u001B[0m \u001B[31m18.7 MB/s\u001B[0m eta \u001B[36m0:00:00\u001B[0m\n\u001B[?25h  Preparing metadata (setup.py): started\n  Preparing metadata (setup.py): finished with status 'done'\nRequirement already satisfied: torch in /databricks/python3/lib/python3.11/site-packages (from flash_attn>=2.5.8) (2.2.2+cu121)\nRequirement already satisfied: einops in /databricks/python3/lib/python3.11/site-packages (from flash_attn>=2.5.8) (0.7.0)\nRequirement already satisfied: triton==2.2.0 in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (2.2.0)\nRequirement already satisfied: nvidia-nvtx-cu12==12.1.105 in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (12.1.105)\nRequirement already satisfied: nvidia-cuda-runtime-cu12==12.1.105 in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (12.1.105)\nRequirement already satisfied: filelock in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (3.9.0)\nRequirement already satisfied: nvidia-cufft-cu12==11.0.2.54 in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (11.0.2.54)\nRequirement already satisfied: nvidia-cudnn-cu12==8.9.2.26 in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (8.9.2.26)\nRequirement already satisfied: typing-extensions>=4.8.0 in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (4.10.0)\nRequirement already satisfied: nvidia-cuda-nvrtc-cu12==12.1.105 in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (12.1.105)\nRequirement already satisfied: nvidia-curand-cu12==10.3.2.106 in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (10.3.2.106)\nRequirement already satisfied: nvidia-cuda-cupti-cu12==12.1.105 in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (12.1.105)\nRequirement already satisfied: nvidia-cublas-cu12==12.1.3.1 in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (12.1.3.1)\nRequirement already satisfied: nvidia-nccl-cu12==2.19.3 in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (2.19.3)\nRequirement already satisfied: fsspec in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (2023.5.0)\nRequirement already satisfied: nvidia-cusolver-cu12==11.4.5.107 in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (11.4.5.107)\nRequirement already satisfied: jinja2 in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (3.1.2)\nRequirement already satisfied: sympy in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (1.11.1)\nRequirement already satisfied: networkx in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (3.1)\nRequirement already satisfied: nvidia-cusparse-cu12==12.1.0.106 in /databricks/python3/lib/python3.11/site-packages (from torch->flash_attn>=2.5.8) (12.1.0.106)\nRequirement already satisfied: nvidia-nvjitlink-cu12 in /databricks/python3/lib/python3.11/site-packages (from nvidia-cusolver-cu12==11.4.5.107->torch->flash_attn>=2.5.8) (12.4.127)\nRequirement already satisfied: MarkupSafe>=2.0 in /databricks/python3/lib/python3.11/site-packages (from jinja2->torch->flash_attn>=2.5.8) (2.1.1)\nRequirement already satisfied: mpmath>=0.19 in /databricks/python3/lib/python3.11/site-packages (from sympy->torch->flash_attn>=2.5.8) (1.3.0)\nBuilding wheels for collected packages: flash_attn\n  Building wheel for flash_attn (setup.py): started\n  Building wheel for flash_attn (setup.py): finished with status 'done'\n  Created wheel for flash_attn: filename=flash_attn-2.6.3-cp311-cp311-linux_x86_64.whl size=187238747 sha256=230c3ba1e0650015eb65ef6a7e9849f0527bdc391cd1d5b971f8972c28516ab9\n  Stored in directory: /root/.cache/pip/wheels/e3/ef/b1/7889928ffa2dea61032e61480db4e4c20d00a9d9e28cd4f55a\nSuccessfully built flash_attn\nInstalling collected packages: flash_attn\n  Attempting uninstall: flash_attn\n    Found existing installation: flash-attn 2.5.6\n    Not uninstalling flash-attn at /databricks/python3/lib/python3.11/site-packages, outside environment /local_disk0/.ephemeral_nfs/envs/pythonEnv-25c3c754-023b-4beb-81a0-db84042570da\n    Can't uninstall 'flash-attn'. No files were found to uninstall.\nSuccessfully installed flash_attn-2.6.3\n\u001B[43mNote: you may need to restart the kernel using %restart_python or dbutils.library.restartPython() to use updated packages.\u001B[0m\n"
     ]
    }
   ],
   "source": [
    "%pip install --quiet bitsandbytes \n",
    "%pip install 'accelerate>=0.31.0'\n",
    "%pip install 'flash_attn>=2.5.8'\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "43d46507-c0bc-4c0c-ab5c-2bf9df3bd558",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\u001B[43mNote: you may need to restart the kernel using %restart_python or dbutils.library.restartPython() to use updated packages.\u001B[0m\nCollecting git+https://github.com/huggingface/transformers.git\n  Cloning https://github.com/huggingface/transformers.git to /tmp/pip-req-build-i8v99ilm\n  Running command git clone --filter=blob:none --quiet https://github.com/huggingface/transformers.git /tmp/pip-req-build-i8v99ilm\n  Resolved https://github.com/huggingface/transformers.git to commit 0a7af19f4dc868bafc82f35eb7e8d13bac87a594\n  Installing build dependencies: started\n  Installing build dependencies: finished with status 'done'\n  Getting requirements to build wheel: started\n  Getting requirements to build wheel: finished with status 'done'\n  Preparing metadata (pyproject.toml): started\n  Preparing metadata (pyproject.toml): finished with status 'done'\nRequirement already satisfied: filelock in /databricks/python3/lib/python3.11/site-packages (from transformers==4.45.0.dev0) (3.9.0)\nRequirement already satisfied: tqdm>=4.27 in /databricks/python3/lib/python3.11/site-packages (from transformers==4.45.0.dev0) (4.65.0)\nRequirement already satisfied: safetensors>=0.4.1 in /databricks/python3/lib/python3.11/site-packages (from transformers==4.45.0.dev0) (0.4.2)\nRequirement already satisfied: packaging>=20.0 in /databricks/python3/lib/python3.11/site-packages (from transformers==4.45.0.dev0) (23.2)\nRequirement already satisfied: regex!=2019.12.17 in /databricks/python3/lib/python3.11/site-packages (from transformers==4.45.0.dev0) (2022.7.9)\nRequirement already satisfied: pyyaml>=5.1 in /databricks/python3/lib/python3.11/site-packages (from transformers==4.45.0.dev0) (6.0)\nRequirement already satisfied: numpy>=1.17 in /databricks/python3/lib/python3.11/site-packages (from transformers==4.45.0.dev0) (1.23.5)\nCollecting tokenizers<0.20,>=0.19\n  Downloading tokenizers-0.19.1-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (3.6 MB)\n\u001B[?25l     \u001B[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m \u001B[32m0.0/3.6 MB\u001B[0m \u001B[31m?\u001B[0m eta \u001B[36m-:--:--\u001B[0m\n\u001B[2K     \u001B[91m━━━\u001B[0m\u001B[90m╺\u001B[0m\u001B[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m \u001B[32m0.3/3.6 MB\u001B[0m \u001B[31m9.7 MB/s\u001B[0m eta \u001B[36m0:00:01\u001B[0m\n\u001B[2K     \u001B[91m━━━━━━━━━━\u001B[0m\u001B[91m╸\u001B[0m\u001B[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m \u001B[32m1.0/3.6 MB\u001B[0m \u001B[31m14.6 MB/s\u001B[0m eta \u001B[36m0:00:01\u001B[0m\n\u001B[2K     \u001B[91m━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[91m╸\u001B[0m\u001B[90m━━━━━━━━━━━━━━━━━━━━\u001B[0m \u001B[32m1.8/3.6 MB\u001B[0m \u001B[31m17.9 MB/s\u001B[0m eta \u001B[36m0:00:01\u001B[0m\n\u001B[2K     \u001B[91m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[91m╸\u001B[0m\u001B[90m━━━━━━━\u001B[0m \u001B[32m3.0/3.6 MB\u001B[0m \u001B[31m21.9 MB/s\u001B[0m eta \u001B[36m0:00:01\u001B[0m\n\u001B[2K     \u001B[91m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[91m╸\u001B[0m \u001B[32m3.6/3.6 MB\u001B[0m \u001B[31m23.8 MB/s\u001B[0m eta \u001B[36m0:00:01\u001B[0m\n\u001B[2K     \u001B[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m \u001B[32m3.6/3.6 MB\u001B[0m \u001B[31m20.7 MB/s\u001B[0m eta \u001B[36m0:00:00\u001B[0m\n\u001B[?25hRequirement already satisfied: huggingface-hub<1.0,>=0.23.2 in /local_disk0/.ephemeral_nfs/envs/pythonEnv-25c3c754-023b-4beb-81a0-db84042570da/lib/python3.11/site-packages (from transformers==4.45.0.dev0) (0.24.6)\nRequirement already satisfied: requests in /databricks/python3/lib/python3.11/site-packages (from transformers==4.45.0.dev0) (2.31.0)\nRequirement already satisfied: fsspec>=2023.5.0 in /databricks/python3/lib/python3.11/site-packages (from huggingface-hub<1.0,>=0.23.2->transformers==4.45.0.dev0) (2023.5.0)\nRequirement already satisfied: typing-extensions>=3.7.4.3 in /databricks/python3/lib/python3.11/site-packages (from huggingface-hub<1.0,>=0.23.2->transformers==4.45.0.dev0) (4.10.0)\nRequirement already satisfied: idna<4,>=2.5 in /databricks/python3/lib/python3.11/site-packages (from requests->transformers==4.45.0.dev0) (3.4)\nRequirement already satisfied: certifi>=2017.4.17 in /databricks/python3/lib/python3.11/site-packages (from requests->transformers==4.45.0.dev0) (2023.7.22)\nRequirement already satisfied: charset-normalizer<4,>=2 in /databricks/python3/lib/python3.11/site-packages (from requests->transformers==4.45.0.dev0) (2.0.4)\nRequirement already satisfied: urllib3<3,>=1.21.1 in /databricks/python3/lib/python3.11/site-packages (from requests->transformers==4.45.0.dev0) (1.26.16)\nBuilding wheels for collected packages: transformers\n  Building wheel for transformers (pyproject.toml): started\n  Building wheel for transformers (pyproject.toml): finished with status 'done'\n  Created wheel for transformers: filename=transformers-4.45.0.dev0-py3-none-any.whl size=9557614 sha256=f034073ecf2cdd2a000b9beaa8e12654b570dfa44e1f0b671fbae029325bd184\n  Stored in directory: /tmp/pip-ephem-wheel-cache-91eskly7/wheels/32/4b/78/f195c684dd3a9ed21f3b39fe8f85b48df7918581b6437be143\nSuccessfully built transformers\nInstalling collected packages: tokenizers, transformers\n  Attempting uninstall: tokenizers\n    Found existing installation: tokenizers 0.15.0\n    Not uninstalling tokenizers at /databricks/python3/lib/python3.11/site-packages, outside environment /local_disk0/.ephemeral_nfs/envs/pythonEnv-25c3c754-023b-4beb-81a0-db84042570da\n    Can't uninstall 'tokenizers'. No files were found to uninstall.\n  Attempting uninstall: transformers\n    Found existing installation: transformers 4.39.2\n    Not uninstalling transformers at /databricks/python3/lib/python3.11/site-packages, outside environment /local_disk0/.ephemeral_nfs/envs/pythonEnv-25c3c754-023b-4beb-81a0-db84042570da\n    Can't uninstall 'transformers'. No files were found to uninstall.\nSuccessfully installed tokenizers-0.19.1 transformers-4.45.0.dev0\n\u001B[43mNote: you may need to restart the kernel using %restart_python or dbutils.library.restartPython() to use updated packages.\u001B[0m\n"
     ]
    }
   ],
   "source": [
    "!pip install git+https://github.com/huggingface/transformers.git"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "fb22f5d0-ca94-45b2-9127-abe7a1c0621d",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [],
   "source": [
    "dbutils.library.restartPython()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "175aa550-9100-412b-9694-a1a7ccde31c4",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Please enter your Hugging Face token.\nYou can find your token at https://huggingface.co/settings/tokens\n"
     ]
    },
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "HF Token:  [REDACTED]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Token is valid (permission: read).\nYour token has been saved in your configured git credential helpers (cache).\nYour token has been saved to /root/.cache/huggingface/token\nLogin successful\nSuccessfully logged in to Hugging Face!\n"
     ]
    }
   ],
   "source": [
    "# if the HF widget does not work!\n",
    "\n",
    "import os\n",
    "from huggingface_hub import login\n",
    "from getpass import getpass\n",
    "\n",
    "def hf_login():\n",
    "    # Check if the token is already set in the environment\n",
    "    if \"HF_TOKEN\" in os.environ:\n",
    "        print(\"Using Hugging Face token from environment variable.\")\n",
    "        token = os.environ[\"HF_TOKEN\"]\n",
    "    else:\n",
    "        # Prompt the user to enter their token\n",
    "        print(\"Please enter your Hugging Face token.\")\n",
    "        print(\"You can find your token at https://huggingface.co/settings/tokens\")\n",
    "        token = getpass(\"HF Token: \")\n",
    "    \n",
    "    # Attempt to log in\n",
    "    try:\n",
    "        login(token=token, add_to_git_credential=True)\n",
    "        print(\"Successfully logged in to Hugging Face!\")\n",
    "        \n",
    "        # Optionally, save the token to the environment for future use\n",
    "        os.environ[\"HF_TOKEN\"] = token\n",
    "    except Exception as e:\n",
    "        print(f\"Failed to log in. Error: {str(e)}\")\n",
    "\n",
    "# Call the function to log in\n",
    "hf_login()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "3ad10512-1383-4fce-8761-8c99ede5c9aa",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "2024-08-24 21:11:13.755032: I tensorflow/core/platform/cpu_feature_guard.cc:210] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\nTo enable the following instructions: AVX2 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\nUnexpected internal error when monkey patching `Trainer.train`: Failed to import transformers.trainer because of the following error (look up to see its traceback):\nFailed to import transformers.integrations.integration_utils because of the following error (look up to see its traceback):\nFailed to import transformers.modeling_tf_utils because of the following error (look up to see its traceback):\nYour currently installed version of Keras is Keras 3, but this is not yet supported in Transformers. Please install the backwards-compatible tf-keras package with `pip install tf-keras`.\n"
     ]
    }
   ],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score, confusion_matrix, classification_report, roc_auc_score\n",
    "import torch\n",
    "from transformers import AutoTokenizer, AutoModelForCausalLM\n",
    "import gc\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "4fd0210e-1709-464a-98ac-a26f673aa825",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "display_data",
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "58a6585737224afbade2071942bddaa9",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "tokenizer_config.json:   0%|          | 0.00/55.4k [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "output_type": "display_data",
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "e938b3c45ab344a7936a99a494f0c28c",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "tokenizer.json:   0%|          | 0.00/9.09M [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "output_type": "display_data",
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "0c40f90e33194f93b647e72702e1285b",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "special_tokens_map.json:   0%|          | 0.00/296 [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\nAnalysis of Training dataset:\nTotal number of rows: 1895\nNumber of unique CSNs: 482\nNotes per CSN:\n  Min: 1\n  Max: 4\n  Mean: 3.93\n  Median: 4.0\n\nClass distribution:\n  Class 1: 63.54%\n  Class 0: 36.46%\n\nNote type distribution:\n  Progress Notes: 67.49%\n  Discharge Summary: 30.13%\n  Plan of Care: 1.95%\n  Assessment: 0.42%\n\nLength statistics (in tokens):\n  Min: 5\n  Max: 27671\n  Mean: 2363.47\n  Median: 1940.0\n  95th percentile: 5710.80\n  99th percentile: 10148.96\n\nAnalysis of Development dataset:\nTotal number of rows: 376\nNumber of unique CSNs: 99\nNotes per CSN:\n  Min: 1\n  Max: 4\n  Mean: 3.80\n  Median: 4.0\n\nClass distribution:\n  Class 1: 66.22%\n  Class 0: 33.78%\n\nNote type distribution:\n  Progress Notes: 67.82%\n  Discharge Summary: 30.05%\n  Plan of Care: 1.06%\n  Assessment: 1.06%\n\nLength statistics (in tokens):\n  Min: 8\n  Max: 15402\n  Mean: 2189.73\n  Median: 1829.5\n  95th percentile: 5704.00\n  99th percentile: 7433.00\n\nAnalysis of Test dataset:\nTotal number of rows: 403\nNumber of unique CSNs: 103\nNotes per CSN:\n  Min: 1\n  Max: 4\n  Mean: 3.91\n  Median: 4.0\n\nClass distribution:\n  Class 1: 60.30%\n  Class 0: 39.70%\n\nNote type distribution:\n  Progress Notes: 67.99%\n  Discharge Summary: 29.53%\n  Assessment: 1.49%\n  Plan of Care: 0.99%\n\nLength statistics (in tokens):\n  Min: 8\n  Max: 16125\n  Mean: 2328.69\n  Median: 1902.0\n  95th percentile: 6236.30\n  99th percentile: 11862.16\n\nAnalysis of Combined dataset:\nTotal number of rows: 2674\nNumber of unique CSNs: 684\nNotes per CSN:\n  Min: 1\n  Max: 4\n  Mean: 3.91\n  Median: 4.0\n\nClass distribution:\n  Class 1: 63.43%\n  Class 0: 36.57%\n\nNote type distribution:\n  Progress Notes: 67.61%\n  Discharge Summary: 30.03%\n  Plan of Care: 1.68%\n  Assessment: 0.67%\n\nLength statistics (in tokens):\n  Min: 5\n  Max: 27671\n  Mean: 2333.80\n  Median: 1911.0\n  95th percentile: 5760.50\n  99th percentile: 10592.13\n"
     ]
    }
   ],
   "source": [
    "# Load the summarized datasets\n",
    "BASE_DIR = \"/Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/\"\n",
    "\n",
    "train_df = pd.read_csv(f\"{BASE_DIR}/ihca_prediction_train_with_summaries.csv\")\n",
    "dev_df = pd.read_csv(f\"{BASE_DIR}/ihca_prediction_dev_with_summaries.csv\")\n",
    "test_df = pd.read_csv(f\"{BASE_DIR}/ihca_prediction_test_with_summaries.csv\")\n",
    "\n",
    "# Combine all datasets for this example\n",
    "all_data = pd.concat([train_df, dev_df, test_df], ignore_index=True)\n",
    "\n",
    "# Load the tokenizer\n",
    "tokenizer = AutoTokenizer.from_pretrained(\"meta-llama/Meta-Llama-3.1-8B-Instruct\")\n",
    "\n",
    "# COMMAND ----------\n",
    "\n",
    "def count_tokens(text):\n",
    "    return len(tokenizer.encode(text))\n",
    "\n",
    "def analyze_dataset(df, name):\n",
    "    print(f\"\\nAnalysis of {name} dataset:\")\n",
    "    print(f\"Total number of rows: {len(df)}\")\n",
    "    print(f\"Number of unique CSNs: {df['csn'].nunique()}\")\n",
    "    \n",
    "    notes_per_csn = df.groupby('csn').size()\n",
    "    print(f\"Notes per CSN:\")\n",
    "    print(f\"  Min: {notes_per_csn.min()}\")\n",
    "    print(f\"  Max: {notes_per_csn.max()}\")\n",
    "    print(f\"  Mean: {notes_per_csn.mean():.2f}\")\n",
    "    print(f\"  Median: {notes_per_csn.median()}\")\n",
    "    \n",
    "    class_distribution = df['cardiac_arrest'].value_counts(normalize=True) * 100\n",
    "    print(\"\\nClass distribution:\")\n",
    "    for class_label, percentage in class_distribution.items():\n",
    "        print(f\"  Class {class_label}: {percentage:.2f}%\")\n",
    "    \n",
    "    print(\"\\nNote type distribution:\")\n",
    "    note_type_dist = df['ip_note_type'].value_counts(normalize=True) * 100\n",
    "    for note_type, percentage in note_type_dist.head().items():\n",
    "        print(f\"  {note_type}: {percentage:.2f}%\")\n",
    "    \n",
    "    # Count tokens for each summary\n",
    "    df['token_count'] = df['note_text'].apply(count_tokens)\n",
    "    \n",
    "    print(\"\\nLength statistics (in tokens):\")\n",
    "    print(f\"  Min: {df['token_count'].min()}\")\n",
    "    print(f\"  Max: {df['token_count'].max()}\")\n",
    "    print(f\"  Mean: {df['token_count'].mean():.2f}\")\n",
    "    print(f\"  Median: {df['token_count'].median()}\")\n",
    "    print(f\"  95th percentile: {df['token_count'].quantile(0.95):.2f}\")\n",
    "    print(f\"  99th percentile: {df['token_count'].quantile(0.99):.2f}\")\n",
    "    \n",
    "    return df\n",
    "\n",
    "# Analyze each dataset\n",
    "train_df = analyze_dataset(train_df, \"Training\")\n",
    "dev_df = analyze_dataset(dev_df, \"Development\")\n",
    "test_df = analyze_dataset(test_df, \"Test\")\n",
    "all_data = analyze_dataset(all_data, \"Combined\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "53b89e89-8f2f-48f1-9646-492f1e023706",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "display_data",
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "bf814050a23646e8aeacbce305e18ff6",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "config.json:   0%|          | 0.00/903 [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "output_type": "display_data",
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "9faafa0fb5c44399a309634a1e7bbbca",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "model.safetensors.index.json:   0%|          | 0.00/23.9k [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "output_type": "display_data",
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "3e02679dd938427aa282956b51f29eb5",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Downloading shards:   0%|          | 0/4 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "output_type": "display_data",
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "b560e42bd6c4420c95cac42c86a22f01",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "model-00001-of-00004.safetensors:   0%|          | 0.00/4.98G [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "output_type": "display_data",
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "011c944c30da428c87b96093daf9b483",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "model-00002-of-00004.safetensors:   0%|          | 0.00/5.00G [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "output_type": "display_data",
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "640ba6f72bf14e0fbcedd2e675fbfddd",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "model-00003-of-00004.safetensors:   0%|          | 0.00/4.92G [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "output_type": "display_data",
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "7dba1c6635194428b322b4abb261f6e4",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "model-00004-of-00004.safetensors:   0%|          | 0.00/1.17G [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "output_type": "display_data",
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "d25fcfcfbdfd4ee5a80850d1110a4588",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Loading checkpoint shards:   0%|          | 0/4 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "output_type": "display_data",
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "92959643c5f941e380d0c5b93e77474a",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "generation_config.json:   0%|          | 0.00/189 [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "import torch\n",
    "from transformers import AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig\n",
    "\n",
    "tokenizer = AutoTokenizer.from_pretrained(\"meta-llama/Meta-Llama-3.1-8B-Instruct\")\n",
    "model = AutoModelForCausalLM.from_pretrained(\"meta-llama/Meta-Llama-3.1-8B-Instruct\")\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "d75a847e-5b35-42b9-a0c2-17ca41f6eecc",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...\nTo disable this warning, you can either:\n\t- Avoid using `tokenizers` before the fork if possible\n\t- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)\n"
     ]
    },
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Fri Aug 23 17:01:41 2024       \r\n+---------------------------------------------------------------------------------------+\r\n| NVIDIA-SMI 535.54.03              Driver Version: 535.54.03    CUDA Version: 12.2     |\r\n|-----------------------------------------+----------------------+----------------------+\r\n| GPU  Name                 Persistence-M | Bus-Id        Disp.A | Volatile Uncorr. ECC |\r\n| Fan  Temp   Perf          Pwr:Usage/Cap |         Memory-Usage | GPU-Util  Compute M. |\r\n|                                         |                      |               MIG M. |\r\n|=========================================+======================+======================|\r\n|   0  NVIDIA A100 80GB PCIe          Off | 00000001:00:00.0 Off |                    0 |\r\n| N/A   34C    P0              47W / 300W |      9MiB / 81920MiB |      0%      Default |\r\n|                                         |                      |             Disabled |\r\n+-----------------------------------------+----------------------+----------------------+\r\n                                                                                         \r\n+---------------------------------------------------------------------------------------+\r\n| Processes:                                                                            |\r\n|  GPU   GI   CI        PID   Type   Process name                            GPU Memory |\r\n|        ID   ID                                                             Usage      |\r\n|=======================================================================================|\r\n|  No running processes found                                                           |\r\n+---------------------------------------------------------------------------------------+\r\n"
     ]
    }
   ],
   "source": [
    "!nvidia-smi"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "acfc0a19-81e5-4830-abfb-c36ca4d8fec6",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import torch\n",
    "from tqdm import tqdm\n",
    "from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score, confusion_matrix\n",
    "import seaborn as sns\n",
    "import matplotlib.pyplot as plt\n",
    "import gc\n",
    "from transformers import AutoTokenizer, AutoModelForCausalLM\n",
    "\n",
    "def load_model(model_name):\n",
    "    tokenizer = AutoTokenizer.from_pretrained(model_name)\n",
    "    model = AutoModelForCausalLM.from_pretrained(\n",
    "        model_name,\n",
    "        device_map=\"auto\",\n",
    "        torch_dtype=torch.float16,\n",
    "        low_cpu_mem_usage=True,\n",
    "    )\n",
    "    model.eval()  # Set the model to evaluation mode\n",
    "    return tokenizer, model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "09343277-e863-47c1-af2f-a083cf4a8420",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [],
   "source": [
    "# Define prompts\n",
    "\n",
    "INSTRUCTION_PROMPT = \"\"\"\n",
    "Given the patient's notes summary, assess whether the patient had an in-hospital cardiac arrest (IHCA) event.\n",
    "IHCA refers to a cardiac arrest that occurs in an inpatient setting where the patient is admitted and receiving care.\n",
    "Cardiac arrests occurring in outpatient settings, such as the hospital's cafeteria or during a visit, do not count as IHCA.\n",
    "Cardiac arrest refers to the sudden loss of cardiac function leading to a lack of a pulse or signs requiring that the patient receives chest compressions, or ACLS.\n",
    "\n",
    "Steps to determine IHCA:\n",
    "1. Identify if there is a mention of cardiac arrest.\n",
    "2. Determine if the cardiac arrest occurred in an inpatient setting.\n",
    "3. Confirm if the patient received chest compressions.\n",
    "\n",
    "Respond with 'positive' or 'negative' and give your rationale.\n",
    "\"\"\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "392f1110-1b58-41c9-82f0-7422638f8073",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [],
   "source": [
    "def get_prediction_with_rationale(summary, model, tokenizer, temperature=0.5):\n",
    "    prompt = f\"\\n\\n{INSTRUCTION_PROMPT}\\n{summary}\\n\\n Your response (positive/negative): \"\n",
    "    inputs = tokenizer(prompt, return_tensors=\"pt\", max_length=7000, truncation=True)\n",
    "    \n",
    "    # Check if the model accepts token_type_ids\n",
    "    model_input_names = getattr(model.config, 'model_input_names', [])\n",
    "    \n",
    "    # If token_type_ids is not in model_input_names, remove it from inputs\n",
    "    if 'token_type_ids' not in model_input_names and 'token_type_ids' in inputs:\n",
    "        del inputs['token_type_ids']\n",
    "    \n",
    "    # Move inputs to the appropriate device\n",
    "    inputs = {k: v.to(model.device) for k, v in inputs.items()}\n",
    "    \n",
    "    # Set up generation kwargs\n",
    "    generation_kwargs = {\n",
    "        \"max_new_tokens\": 200,\n",
    "        \"temperature\": temperature,\n",
    "        \"do_sample\": True,\n",
    "        \"top_p\": 0.95,\n",
    "        \"num_return_sequences\": 1,\n",
    "        \"no_repeat_ngram_size\": 3,\n",
    "    }\n",
    "    \n",
    "    # Add pad_token_id and eos_token_id if they exist in the tokenizer\n",
    "    if hasattr(tokenizer, 'eos_token_id'):\n",
    "        generation_kwargs[\"eos_token_id\"] = tokenizer.eos_token_id\n",
    "    if hasattr(tokenizer, 'pad_token_id'):\n",
    "        generation_kwargs[\"pad_token_id\"] = tokenizer.pad_token_id\n",
    "    \n",
    "    with torch.no_grad():\n",
    "        outputs = model.generate(\n",
    "            **inputs,\n",
    "            **generation_kwargs\n",
    "        )\n",
    "    \n",
    "    model_response = tokenizer.decode(outputs[0][inputs['input_ids'].shape[1]:], skip_special_tokens=True).strip()\n",
    "    \n",
    "    # Determine the prediction based on the model response\n",
    "    response_lower = model_response.lower()\n",
    "    if any(word in response_lower for word in [\"positive\", \"yes\"]):\n",
    "        prediction = 1\n",
    "    elif any(word in response_lower for word in [\"negative\", \"no\"]):\n",
    "        prediction = 0\n",
    "    else:\n",
    "        positive_indicators = ['cardiac arrest occurred', 'ihca event', 'in-hospital cardiac arrest confirmed']\n",
    "        negative_indicators = ['no cardiac arrest', 'no mention of cardiac arrest', 'no ihca', 'not an ihca event']\n",
    "        \n",
    "        if any(indicator in response_lower for indicator in positive_indicators):\n",
    "            prediction = 1\n",
    "        elif any(indicator in response_lower for indicator in negative_indicators):\n",
    "            prediction = 0\n",
    "        else:\n",
    "            prediction = 0\n",
    "    \n",
    "    # Return both the prediction and the full model response\n",
    "    return prediction, model_response"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "c357d827-3742-47dd-abaa-140c28af3b09",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [],
   "source": [
    "def generate_predictions_with_rationales(df, model, tokenizer, batch_size=5, temperature=0.2):\n",
    "    predictions = []\n",
    "    rationales = []\n",
    "    \n",
    "    progress_bar = tqdm(total=len(df), desc=\"Generating predictions\", unit=\"sample\")\n",
    "    \n",
    "    for i in range(0, len(df), batch_size):\n",
    "        batch = df.iloc[i:i+batch_size]\n",
    "        \n",
    "        batch_predictions = []\n",
    "        batch_rationales = []\n",
    "        \n",
    "        for _, row in batch.iterrows():\n",
    "            prediction, rationale = get_prediction_with_rationale(row['note_text'], model, tokenizer, temperature)\n",
    "            batch_predictions.append(prediction)\n",
    "            batch_rationales.append(rationale)\n",
    "        \n",
    "        predictions.extend(batch_predictions)\n",
    "        rationales.extend(batch_rationales)\n",
    "        \n",
    "        progress_bar.update(batch_size)\n",
    "        \n",
    "        # Clear CUDA cache and collect garbage\n",
    "        if torch.cuda.is_available():\n",
    "            torch.cuda.empty_cache()\n",
    "        gc.collect()\n",
    "    \n",
    "    progress_bar.close()\n",
    "    \n",
    "    return predictions, rationales\n",
    "\n",
    "def majority_vote(group):\n",
    "    return 1 if group['predicted_ihca'].mean() >= 0.01 else 0"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "10a176d3-5a3d-4847-a6cc-2093c91e77a8",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [],
   "source": [
    "import json\n",
    "import os\n",
    "from datetime import datetime\n",
    "\n",
    "def save_model_results(model_name, test_data, csn_results, metrics, confusion_matrix):\n",
    "    BASE_DIR = \"/Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/\"\n",
    "    RESULTS_DIR = os.path.join(BASE_DIR, \"model_results\")\n",
    "    \n",
    "    # Create the results directory if it doesn't exist\n",
    "    os.makedirs(RESULTS_DIR, exist_ok=True)\n",
    "    \n",
    "    # Create a timestamp for the filename\n",
    "    timestamp = datetime.now().strftime(\"%Y%m%d_%H%M%S\")\n",
    "    filename = f\"{model_name.replace('/', '_')}_{timestamp}.json\"\n",
    "    \n",
    "    # Prepare the results dictionary\n",
    "    results = {\n",
    "        \"model_name\": model_name,\n",
    "        \"timestamp\": timestamp,\n",
    "        \"metrics\": metrics,\n",
    "        \"confusion_matrix\": confusion_matrix.tolist(),\n",
    "        \"predictions\": test_data[['csn', 'predicted_ihca', 'rationale']].to_dict('records'),\n",
    "        \"csn_results\": csn_results[['csn', 'predicted_ihca', 'cardiac_arrest']].to_dict('records')\n",
    "    }\n",
    "    \n",
    "    # Save the results to a JSON file\n",
    "    file_path = os.path.join(RESULTS_DIR, filename)\n",
    "    with open(file_path, 'w') as f:\n",
    "        json.dump(results, f, indent=2)\n",
    "    \n",
    "    print(f\"Results saved to {file_path}\")\n",
    "    \n",
    "    # Also save CSN-level results to a CSV file\n",
    "    csv_filename = f\"{model_name.replace('/', '_')}_{timestamp}_results.csv\"\n",
    "    csv_path = os.path.join(RESULTS_DIR, csv_filename)\n",
    "    csn_results.to_csv(csv_path, index=False)\n",
    "    print(f\"CSV results saved to {csv_path}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "6d5e63b4-aef5-42f6-a8e4-8591d6647340",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [],
   "source": [
    "import json\n",
    "import os\n",
    "from datetime import datetime\n",
    "\n",
    "def save_model_results(model_name, test_data, csn_results, metrics, confusion_matrix):\n",
    "    BASE_DIR = \"/Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/\"\n",
    "    RESULTS_DIR = os.path.join(BASE_DIR, \"model_results\")\n",
    "    \n",
    "    # Create the results directory if it doesn't exist\n",
    "    os.makedirs(RESULTS_DIR, exist_ok=True)\n",
    "    \n",
    "    # Create a timestamp for the filename\n",
    "    timestamp = datetime.now().strftime(\"%Y%m%d_%H%M%S\")\n",
    "    # Replace forward slashes in model name with underscores\n",
    "    safe_model_name = model_name.replace('/', '_')\n",
    "    filename = f\"{safe_model_name}_{timestamp}.json\"\n",
    "    \n",
    "    # Prepare the results dictionary\n",
    "    results = {\n",
    "        \"model_name\": model_name,\n",
    "        \"timestamp\": timestamp,\n",
    "        \"metrics\": metrics,\n",
    "        \"confusion_matrix\": confusion_matrix.tolist(),\n",
    "        \"predictions\": test_data[['csn', 'predicted_ihca', 'rationale']].to_dict('records'),\n",
    "        \"csn_results\": csn_results[['csn', 'predicted_ihca', 'cardiac_arrest']].to_dict('records')\n",
    "    }\n",
    "    \n",
    "    # Save the results to a JSON file\n",
    "    file_path = os.path.join(RESULTS_DIR, filename)\n",
    "    try:\n",
    "        with open(file_path, 'w') as f:\n",
    "            json.dump(results, f, indent=2)\n",
    "        print(f\"Results saved to {file_path}\")\n",
    "    except IOError as e:\n",
    "        print(f\"Error saving results to {file_path}: {e}\")\n",
    "        # Try saving to a different location\n",
    "        alt_file_path = f\"/dbfs/FileStore/{filename}\"\n",
    "        with open(alt_file_path, 'w') as f:\n",
    "            json.dump(results, f, indent=2)\n",
    "        print(f\"Results saved to alternative location: {alt_file_path}\")\n",
    "    \n",
    "    # Also save CSN-level results to a CSV file\n",
    "    csv_filename = f\"{safe_model_name}_{timestamp}_results.csv\"\n",
    "    csv_path = os.path.join(RESULTS_DIR, csv_filename)\n",
    "    try:\n",
    "        csn_results.to_csv(csv_path, index=False)\n",
    "        print(f\"CSV results saved to {csv_path}\")\n",
    "    except IOError as e:\n",
    "        print(f\"Error saving CSV to {csv_path}: {e}\")\n",
    "        # Try saving to a different location\n",
    "        alt_csv_path = f\"/dbfs/FileStore/{csv_filename}\"\n",
    "        csn_results.to_csv(alt_csv_path, index=False)\n",
    "        print(f\"CSV results saved to alternative location: {alt_csv_path}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "2fa104ba-b9f1-42b0-9856-04c25263b3a3",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [],
   "source": [
    "def test_run(data, model, tokenizer, model_name, num_samples=10, random_state=None, batch_size=1):\n",
    "    test_data = data.sample(n=num_samples, random_state=random_state) if random_state else data.sample(n=num_samples)\n",
    "    \n",
    "    print(f\"Running test prediction on {num_samples} samples...\")\n",
    "    \n",
    "    predictions, rationales = generate_predictions_with_rationales(test_data, model, tokenizer, batch_size=batch_size)\n",
    "    \n",
    "    test_data['predicted_ihca'] = predictions\n",
    "    test_data['rationale'] = rationales\n",
    "    \n",
    "    # Perform majority voting at CSN level\n",
    "    csn_predictions = test_data.groupby('csn').apply(majority_vote).reset_index()\n",
    "    csn_predictions.columns = ['csn', 'predicted_ihca']\n",
    "    \n",
    "    # Merge back to get actual IHCA status\n",
    "    csn_actual = test_data.groupby('csn')['cardiac_arrest'].first().reset_index()\n",
    "    csn_results = pd.merge(csn_predictions, csn_actual, on='csn')\n",
    "    \n",
    "    # Calculate metrics\n",
    "    accuracy = accuracy_score(csn_results['cardiac_arrest'], csn_results['predicted_ihca'])\n",
    "    precision = precision_score(csn_results['cardiac_arrest'], csn_results['predicted_ihca'])\n",
    "    recall = recall_score(csn_results['cardiac_arrest'], csn_results['predicted_ihca'])\n",
    "    f1 = f1_score(csn_results['cardiac_arrest'], csn_results['predicted_ihca'])\n",
    "    \n",
    "    metrics = {\n",
    "        \"accuracy\": accuracy,\n",
    "        \"precision\": precision,\n",
    "        \"recall\": recall,\n",
    "        \"f1_score\": f1\n",
    "    }\n",
    "    \n",
    "    # Generate confusion matrix\n",
    "    cm = confusion_matrix(csn_results['cardiac_arrest'], csn_results['predicted_ihca'])\n",
    "    \n",
    "    # Save the results\n",
    "    save_model_results(model_name, test_data, csn_results, metrics, cm)\n",
    "    \n",
    "    # Print results and plot confusion matrix as before\n",
    "    print(\"\\nTest Metrics (CSN level):\")\n",
    "    for metric, value in metrics.items():\n",
    "        print(f\"{metric.capitalize()}: {value:.2f}\")\n",
    "    \n",
    "    plt.figure(figsize=(10,7))\n",
    "    sns.heatmap(cm, annot=True, fmt='d', cmap='Blues')\n",
    "    plt.title(f'Confusion Matrix (CSN level) - {model_name}')\n",
    "    plt.ylabel('Actual')\n",
    "    plt.xlabel('Predicted')\n",
    "    plt.show()\n",
    "    \n",
    "    return test_data, csn_results"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "73f7bde5-ba1c-4394-9a6f-93e679390972",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "display_data",
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "99b83b2b39094396a19697785cef00e6",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Loading checkpoint shards:   0%|          | 0/4 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# Load the model with optimizations\n",
    "model_name = \"meta-llama/Meta-Llama-3.1-8B-Instruct\"\n",
    "tokenizer, model = load_model(model_name)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "f45d1a93-5feb-40d9-92b4-097ce0cc19c4",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Running test prediction on 1000 samples...\n"
     ]
    },
    {
     "output_type": "stream",
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\rGenerating predictions:   0%|          | 0/1000 [00:00<?, ?sample/s]\rGenerating predictions:   0%|          | 5/1000 [00:03<11:25,  1.45sample/s]\rGenerating predictions:   1%|          | 10/1000 [00:16<30:25,  1.84s/sample]\rGenerating predictions:   2%|▏         | 15/1000 [00:21<24:20,  1.48s/sample]\rGenerating predictions:   2%|▏         | 20/1000 [00:37<34:21,  2.10s/sample]\rGenerating predictions:   2%|▎         | 25/1000 [00:45<32:03,  1.97s/sample]\rGenerating predictions:   3%|▎         | 30/1000 [00:54<30:56,  1.91s/sample]\rGenerating predictions:   4%|▎         | 35/1000 [01:07<33:50,  2.10s/sample]\rGenerating predictions:   4%|▍         | 40/1000 [01:19<35:21,  2.21s/sample]\rGenerating predictions:   4%|▍         | 45/1000 [01:28<32:37,  2.05s/sample]\rGenerating predictions:   5%|▌         | 50/1000 [01:41<35:13,  2.22s/sample]\rGenerating predictions:   6%|▌         | 55/1000 [01:58<41:20,  2.62s/sample]\rGenerating predictions:   6%|▌         | 60/1000 [02:07<36:59,  2.36s/sample]\rGenerating predictions:   6%|▋         | 65/1000 [02:15<32:37,  2.09s/sample]\rGenerating predictions:   7%|▋         | 70/1000 [02:29<36:03,  2.33s/sample]\rGenerating predictions:   8%|▊         | 75/1000 [02:49<43:41,  2.83s/sample]\rGenerating predictions:   8%|▊         | 80/1000 [03:04<44:03,  2.87s/sample]\rGenerating predictions:   8%|▊         | 85/1000 [03:10<36:38,  2.40s/sample]\rGenerating predictions:   9%|▉         | 90/1000 [03:22<36:05,  2.38s/sample]\rGenerating predictions:  10%|▉         | 95/1000 [03:40<41:45,  2.77s/sample]\rGenerating predictions:  10%|█         | 100/1000 [03:55<42:02,  2.80s/sample]\rGenerating predictions:  10%|█         | 105/1000 [04:01<35:21,  2.37s/sample]\rGenerating predictions:  11%|█         | 110/1000 [04:17<38:23,  2.59s/sample]\rGenerating predictions:  12%|█▏        | 115/1000 [04:25<33:29,  2.27s/sample]\rGenerating predictions:  12%|█▏        | 120/1000 [04:30<28:08,  1.92s/sample]\rGenerating predictions:  12%|█▎        | 125/1000 [04:42<30:22,  2.08s/sample]\rGenerating predictions:  13%|█▎        | 130/1000 [04:53<29:58,  2.07s/sample]\rGenerating predictions:  14%|█▎        | 135/1000 [05:05<31:34,  2.19s/sample]\rGenerating predictions:  14%|█▍        | 140/1000 [05:11<27:32,  1.92s/sample]\rGenerating predictions:  14%|█▍        | 145/1000 [05:31<35:48,  2.51s/sample]\rGenerating predictions:  15%|█▌        | 150/1000 [05:41<33:45,  2.38s/sample]\rGenerating predictions:  16%|█▌        | 155/1000 [05:49<30:09,  2.14s/sample]\rGenerating predictions:  16%|█▌        | 160/1000 [05:53<23:49,  1.70s/sample]\rGenerating predictions:  16%|█▋        | 165/1000 [06:02<24:46,  1.78s/sample]\rGenerating predictions:  17%|█▋        | 170/1000 [06:15<27:39,  2.00s/sample]\rGenerating predictions:  18%|█▊        | 175/1000 [06:28<30:24,  2.21s/sample]\rGenerating predictions:  18%|█▊        | 180/1000 [06:34<25:47,  1.89s/sample]\rGenerating predictions:  18%|█▊        | 185/1000 [06:41<23:40,  1.74s/sample]\rGenerating predictions:  19%|█▉        | 190/1000 [06:50<23:12,  1.72s/sample]\rGenerating predictions:  20%|█▉        | 195/1000 [06:57<22:24,  1.67s/sample]\rGenerating predictions:  20%|██        | 200/1000 [07:07<22:58,  1.72s/sample]\rGenerating predictions:  20%|██        | 205/1000 [07:13<20:52,  1.58s/sample]\rGenerating predictions:  21%|██        | 210/1000 [07:24<23:47,  1.81s/sample]\rGenerating predictions:  22%|██▏       | 215/1000 [07:31<21:30,  1.64s/sample]\rGenerating predictions:  22%|██▏       | 220/1000 [07:38<20:46,  1.60s/sample]\rGenerating predictions:  22%|██▎       | 225/1000 [07:53<25:57,  2.01s/sample]\rGenerating predictions:  23%|██▎       | 230/1000 [08:07<29:06,  2.27s/sample]\rGenerating predictions:  24%|██▎       | 235/1000 [08:24<33:18,  2.61s/sample]\rGenerating predictions:  24%|██▍       | 240/1000 [08:33<29:56,  2.36s/sample]\rGenerating predictions:  24%|██▍       | 245/1000 [08:49<32:20,  2.57s/sample]\rGenerating predictions:  25%|██▌       | 250/1000 [09:06<35:16,  2.82s/sample]\rGenerating predictions:  26%|██▌       | 255/1000 [09:12<29:15,  2.36s/sample]\rGenerating predictions:  26%|██▌       | 260/1000 [09:18<24:45,  2.01s/sample]\rGenerating predictions:  26%|██▋       | 265/1000 [09:26<23:00,  1.88s/sample]\rGenerating predictions:  27%|██▋       | 270/1000 [09:34<21:59,  1.81s/sample]\rGenerating predictions:  28%|██▊       | 275/1000 [09:46<24:05,  1.99s/sample]\rGenerating predictions:  28%|██▊       | 280/1000 [09:55<23:24,  1.95s/sample]\rGenerating predictions:  28%|██▊       | 285/1000 [10:02<20:59,  1.76s/sample]\rGenerating predictions:  29%|██▉       | 290/1000 [10:10<20:11,  1.71s/sample]\rGenerating predictions:  30%|██▉       | 295/1000 [10:23<22:56,  1.95s/sample]\rGenerating predictions:  30%|███       | 300/1000 [10:34<24:08,  2.07s/sample]\rGenerating predictions:  30%|███       | 305/1000 [10:43<22:58,  1.98s/sample]\rGenerating predictions:  31%|███       | 310/1000 [10:49<20:07,  1.75s/sample]\rGenerating predictions:  32%|███▏      | 315/1000 [11:01<21:57,  1.92s/sample]\rGenerating predictions:  32%|███▏      | 320/1000 [11:12<22:30,  1.99s/sample]\rGenerating predictions:  32%|███▎      | 325/1000 [11:26<25:33,  2.27s/sample]\rGenerating predictions:  33%|███▎      | 330/1000 [11:34<23:16,  2.08s/sample]\rGenerating predictions:  34%|███▎      | 335/1000 [11:44<22:11,  2.00s/sample]\rGenerating predictions:  34%|███▍      | 340/1000 [11:55<22:57,  2.09s/sample]\rGenerating predictions:  34%|███▍      | 345/1000 [12:03<21:19,  1.95s/sample]\rGenerating predictions:  35%|███▌      | 350/1000 [12:16<22:50,  2.11s/sample]\rGenerating predictions:  36%|███▌      | 355/1000 [12:26<22:27,  2.09s/sample]\rGenerating predictions:  36%|███▌      | 360/1000 [12:45<28:07,  2.64s/sample]\rGenerating predictions:  36%|███▋      | 365/1000 [12:56<26:23,  2.49s/sample]\rGenerating predictions:  37%|███▋      | 370/1000 [13:07<25:22,  2.42s/sample]\rGenerating predictions:  38%|███▊      | 375/1000 [13:14<22:02,  2.12s/sample]\rGenerating predictions:  38%|███▊      | 380/1000 [13:20<18:52,  1.83s/sample]\rGenerating predictions:  38%|███▊      | 385/1000 [13:32<20:25,  1.99s/sample]\rGenerating predictions:  39%|███▉      | 390/1000 [13:48<23:52,  2.35s/sample]\rGenerating predictions:  40%|███▉      | 395/1000 [13:57<22:12,  2.20s/sample]\rGenerating predictions:  40%|████      | 400/1000 [14:03<18:44,  1.87s/sample]\rGenerating predictions:  40%|████      | 405/1000 [14:16<20:37,  2.08s/sample]\rGenerating predictions:  41%|████      | 410/1000 [14:28<21:28,  2.18s/sample]\rGenerating predictions:  42%|████▏     | 415/1000 [14:42<22:59,  2.36s/sample]\rGenerating predictions:  42%|████▏     | 420/1000 [14:47<19:18,  2.00s/sample]\rGenerating predictions:  42%|████▎     | 425/1000 [14:54<17:04,  1.78s/sample]\rGenerating predictions:  43%|████▎     | 430/1000 [15:05<18:03,  1.90s/sample]\rGenerating predictions:  44%|████▎     | 435/1000 [15:09<15:18,  1.62s/sample]\rGenerating predictions:  44%|████▍     | 440/1000 [15:21<16:55,  1.81s/sample]\rGenerating predictions:  44%|████▍     | 445/1000 [15:35<19:35,  2.12s/sample]\rGenerating predictions:  45%|████▌     | 450/1000 [15:51<22:27,  2.45s/sample]\rGenerating predictions:  46%|████▌     | 455/1000 [16:05<23:27,  2.58s/sample]\rGenerating predictions:  46%|████▌     | 460/1000 [16:13<20:31,  2.28s/sample]\rGenerating predictions:  46%|████▋     | 465/1000 [16:20<17:51,  2.00s/sample]\rGenerating predictions:  47%|████▋     | 470/1000 [16:35<20:13,  2.29s/sample]\rGenerating predictions:  48%|████▊     | 475/1000 [16:50<22:04,  2.52s/sample]\rGenerating predictions:  48%|████▊     | 480/1000 [17:00<20:06,  2.32s/sample]\rGenerating predictions:  48%|████▊     | 485/1000 [17:13<20:48,  2.43s/sample]\rGenerating predictions:  49%|████▉     | 490/1000 [17:20<18:08,  2.13s/sample]\rGenerating predictions:  50%|████▉     | 495/1000 [17:31<18:14,  2.17s/sample]\rGenerating predictions:  50%|█████     | 500/1000 [17:42<17:47,  2.14s/sample]\rGenerating predictions:  50%|█████     | 505/1000 [18:02<22:10,  2.69s/sample]\rGenerating predictions:  51%|█████     | 510/1000 [18:10<19:28,  2.39s/sample]\rGenerating predictions:  52%|█████▏    | 515/1000 [18:15<15:49,  1.96s/sample]\rGenerating predictions:  52%|█████▏    | 520/1000 [18:22<14:35,  1.82s/sample]\rGenerating predictions:  52%|█████▎    | 525/1000 [18:29<13:09,  1.66s/sample]\rGenerating predictions:  53%|█████▎    | 530/1000 [18:33<11:21,  1.45s/sample]\rGenerating predictions:  54%|█████▎    | 535/1000 [18:44<12:43,  1.64s/sample]\rGenerating predictions:  54%|█████▍    | 540/1000 [18:59<15:50,  2.07s/sample]\rGenerating predictions:  55%|█████▍    | 545/1000 [19:09<15:13,  2.01s/sample]\rGenerating predictions:  55%|█████▌    | 550/1000 [19:19<15:20,  2.05s/sample]\rGenerating predictions:  56%|█████▌    | 555/1000 [19:31<15:53,  2.14s/sample]\rGenerating predictions:  56%|█████▌    | 560/1000 [19:36<13:05,  1.78s/sample]\rGenerating predictions:  56%|█████▋    | 565/1000 [19:44<12:40,  1.75s/sample]\rGenerating predictions:  57%|█████▋    | 570/1000 [19:55<13:22,  1.87s/sample]\rGenerating predictions:  57%|█████▊    | 575/1000 [20:01<11:51,  1.67s/sample]\rGenerating predictions:  58%|█████▊    | 580/1000 [20:19<15:47,  2.25s/sample]\rGenerating predictions:  58%|█████▊    | 585/1000 [20:37<18:11,  2.63s/sample]\rGenerating predictions:  59%|█████▉    | 590/1000 [20:45<16:06,  2.36s/sample]\rGenerating predictions:  60%|█████▉    | 595/1000 [21:09<20:38,  3.06s/sample]\rGenerating predictions:  60%|██████    | 600/1000 [21:30<22:58,  3.45s/sample]\rGenerating predictions:  60%|██████    | 605/1000 [21:49<23:07,  3.51s/sample]\rGenerating predictions:  61%|██████    | 610/1000 [21:56<18:48,  2.89s/sample]\rGenerating predictions:  62%|██████▏   | 615/1000 [22:11<18:46,  2.93s/sample]\rGenerating predictions:  62%|██████▏   | 620/1000 [22:23<17:29,  2.76s/sample]\rGenerating predictions:  62%|██████▎   | 625/1000 [22:30<14:44,  2.36s/sample]\rGenerating predictions:  63%|██████▎   | 630/1000 [22:42<14:40,  2.38s/sample]\rGenerating predictions:  64%|██████▎   | 635/1000 [22:48<12:20,  2.03s/sample]\rGenerating predictions:  64%|██████▍   | 640/1000 [22:57<11:40,  1.94s/sample]\rGenerating predictions:  64%|██████▍   | 645/1000 [23:05<10:58,  1.85s/sample]\rGenerating predictions:  65%|██████▌   | 650/1000 [23:18<12:12,  2.09s/sample]\rGenerating predictions:  66%|██████▌   | 655/1000 [23:27<11:13,  1.95s/sample]\rGenerating predictions:  66%|██████▌   | 660/1000 [23:48<15:01,  2.65s/sample]\rGenerating predictions:  66%|██████▋   | 665/1000 [24:06<16:24,  2.94s/sample]\rGenerating predictions:  67%|██████▋   | 670/1000 [24:21<16:20,  2.97s/sample]\rGenerating predictions:  68%|██████▊   | 675/1000 [24:27<13:13,  2.44s/sample]\rGenerating predictions:  68%|██████▊   | 680/1000 [24:39<12:58,  2.43s/sample]\rGenerating predictions:  68%|██████▊   | 685/1000 [24:45<10:38,  2.03s/sample]\rGenerating predictions:  69%|██████▉   | 690/1000 [24:59<11:54,  2.30s/sample]\rGenerating predictions:  70%|██████▉   | 695/1000 [25:14<12:34,  2.47s/sample]\rGenerating predictions:  70%|███████   | 700/1000 [25:24<11:43,  2.34s/sample]\rGenerating predictions:  70%|███████   | 705/1000 [25:34<10:55,  2.22s/sample]\rGenerating predictions:  71%|███████   | 710/1000 [25:46<11:04,  2.29s/sample]\rGenerating predictions:  72%|███████▏  | 715/1000 [26:02<12:07,  2.55s/sample]\rGenerating predictions:  72%|███████▏  | 720/1000 [26:09<10:19,  2.21s/sample]\rGenerating predictions:  72%|███████▎  | 725/1000 [26:20<10:08,  2.21s/sample]\rGenerating predictions:  73%|███████▎  | 730/1000 [26:32<10:08,  2.25s/sample]\rGenerating predictions:  74%|███████▎  | 735/1000 [26:40<09:05,  2.06s/sample]\rGenerating predictions:  74%|███████▍  | 740/1000 [26:51<09:18,  2.15s/sample]\rGenerating predictions:  74%|███████▍  | 745/1000 [27:03<09:21,  2.20s/sample]\rGenerating predictions:  75%|███████▌  | 750/1000 [27:11<08:23,  2.02s/sample]\rGenerating predictions:  76%|███████▌  | 755/1000 [27:24<08:49,  2.16s/sample]\rGenerating predictions:  76%|███████▌  | 760/1000 [27:29<07:18,  1.83s/sample]\rGenerating predictions:  76%|███████▋  | 765/1000 [27:37<06:49,  1.74s/sample]\rGenerating predictions:  77%|███████▋  | 770/1000 [27:49<07:37,  1.99s/sample]\rGenerating predictions:  78%|███████▊  | 775/1000 [27:57<06:58,  1.86s/sample]\rGenerating predictions:  78%|███████▊  | 780/1000 [28:19<09:33,  2.61s/sample]\rGenerating predictions:  78%|███████▊  | 785/1000 [28:35<09:55,  2.77s/sample]\rGenerating predictions:  79%|███████▉  | 790/1000 [28:43<08:27,  2.42s/sample]\rGenerating predictions:  80%|███████▉  | 795/1000 [28:47<06:39,  1.95s/sample]\rGenerating predictions:  80%|████████  | 800/1000 [28:57<06:34,  1.97s/sample]\rGenerating predictions:  80%|████████  | 805/1000 [29:07<06:26,  1.98s/sample]\rGenerating predictions:  81%|████████  | 810/1000 [29:26<08:01,  2.53s/sample]\rGenerating predictions:  82%|████████▏ | 815/1000 [29:33<06:46,  2.20s/sample]\rGenerating predictions:  82%|████████▏ | 820/1000 [29:45<06:46,  2.26s/sample]\rGenerating predictions:  82%|████████▎ | 825/1000 [30:00<07:09,  2.45s/sample]\rGenerating predictions:  83%|████████▎ | 830/1000 [30:08<06:13,  2.19s/sample]\rGenerating predictions:  84%|████████▎ | 835/1000 [30:21<06:28,  2.35s/sample]\rGenerating predictions:  84%|████████▍ | 840/1000 [30:30<05:49,  2.18s/sample]\rGenerating predictions:  84%|████████▍ | 845/1000 [30:42<05:43,  2.22s/sample]\rGenerating predictions:  85%|████████▌ | 850/1000 [30:50<05:11,  2.08s/sample]\rGenerating predictions:  86%|████████▌ | 855/1000 [31:00<04:55,  2.04s/sample]\rGenerating predictions:  86%|████████▌ | 860/1000 [31:16<05:33,  2.38s/sample]\rGenerating predictions:  86%|████████▋ | 865/1000 [31:25<04:53,  2.17s/sample]\rGenerating predictions:  87%|████████▋ | 870/1000 [31:28<03:48,  1.76s/sample]\rGenerating predictions:  88%|████████▊ | 875/1000 [31:42<04:15,  2.05s/sample]\rGenerating predictions:  88%|████████▊ | 880/1000 [31:56<04:34,  2.29s/sample]\rGenerating predictions:  88%|████████▊ | 885/1000 [32:17<05:25,  2.83s/sample]\rGenerating predictions:  89%|████████▉ | 890/1000 [32:30<05:05,  2.78s/sample]\rGenerating predictions:  90%|████████▉ | 895/1000 [32:43<04:44,  2.71s/sample]\rGenerating predictions:  90%|█████████ | 900/1000 [32:51<03:59,  2.40s/sample]\rGenerating predictions:  90%|█████████ | 905/1000 [33:02<03:42,  2.35s/sample]\rGenerating predictions:  91%|█████████ | 910/1000 [33:18<03:52,  2.58s/sample]\rGenerating predictions:  92%|█████████▏| 915/1000 [33:24<03:05,  2.18s/sample]\rGenerating predictions:  92%|█████████▏| 920/1000 [33:32<02:38,  1.98s/sample]\rGenerating predictions:  92%|█████████▎| 925/1000 [33:48<02:58,  2.38s/sample]\rGenerating predictions:  93%|█████████▎| 930/1000 [33:54<02:19,  1.99s/sample]\rGenerating predictions:  94%|█████████▎| 935/1000 [34:03<02:07,  1.95s/sample]\rGenerating predictions:  94%|█████████▍| 940/1000 [34:22<02:30,  2.50s/sample]\rGenerating predictions:  94%|█████████▍| 945/1000 [34:29<01:59,  2.18s/sample]\rGenerating predictions:  95%|█████████▌| 950/1000 [34:41<01:52,  2.25s/sample]\rGenerating predictions:  96%|█████████▌| 955/1000 [34:50<01:35,  2.13s/sample]\rGenerating predictions:  96%|█████████▌| 960/1000 [34:55<01:09,  1.74s/sample]\rGenerating predictions:  96%|█████████▋| 965/1000 [35:06<01:06,  1.89s/sample]\rGenerating predictions:  97%|█████████▋| 970/1000 [35:17<01:00,  2.00s/sample]\rGenerating predictions:  98%|█████████▊| 975/1000 [35:37<01:04,  2.57s/sample]\rGenerating predictions:  98%|█████████▊| 980/1000 [35:56<00:59,  2.96s/sample]\rGenerating predictions:  98%|█████████▊| 985/1000 [36:00<00:34,  2.32s/sample]\rGenerating predictions:  99%|█████████▉| 990/1000 [36:12<00:23,  2.35s/sample]\rGenerating predictions: 100%|█████████▉| 995/1000 [36:21<00:10,  2.18s/sample]\rGenerating predictions: 100%|██████████| 1000/1000 [36:29<00:00,  1.97s/sample]\rGenerating predictions: 100%|██████████| 1000/1000 [36:29<00:00,  2.19s/sample]\n"
     ]
    },
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Results saved to /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/model_results/OpenMeditron_Meditron3-8B_20240823_174423.json\nCSV results saved to /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/model_results/OpenMeditron_Meditron3-8B_20240823_174423_results.csv\n\nTest Metrics (CSN level):\nAccuracy: 0.55\nPrecision: 0.61\nRecall: 0.82\nF1_score: 0.70\n"
     ]
    },
    {
     "output_type": "display_data",
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAxEAAAJwCAYAAAD2uOwtAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMCwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy88F64QAAAACXBIWXMAAA9hAAAPYQGoP6dpAABVr0lEQVR4nO3deZyN9f//8eeZGXOMYWYMxsxYxljHlkTJvmbNEipLRZQUPpaotNmKkj6VXSUkfNpEUeRjDSNS1iREFDO2xmQwlnn//vCb87mOGa65GDOj7+N+u53bzbmu97mu97mcc+a8zvP9vi6XMcYIAAAAADLIJ7s7AAAAAODWQhEBAAAAwBGKCAAAAACOUEQAAAAAcIQiAgAAAIAjFBEAAAAAHKGIAAAAAOAIRQQAAAAARygiAAAAADhCEYGbbs+ePWratKmCg4Plcrm0YMGCTN3+gQMH5HK5NHPmzEzd7q2sQYMGatCgQaZu89ChQ8qdO7fWrVuXqdu9mUqUKKHu3btndzckpe3LkiVLlDdvXh07diz7OgV1795dJUqU8Frmcrk0fPjwbOnPrYRjB/zfRhHxf8S+ffv0xBNPqGTJksqdO7eCgoJUu3ZtvfPOOzp79uxN3Xe3bt20fft2vfrqq5o9e7aqV69+U/eXlbp37y6Xy6WgoKB0j+OePXvkcrnkcrk0btw4x9s/fPiwhg8fri1btmRCb2/MyJEjVaNGDdWuXTvNulWrVql9+/YKDw+Xv7+/wsLC1Lp1a82fP9+r3bFjx9S/f3/FxMQoICBAYWFhuuuuu/Tss8/q9OnTnnapx/W2226TMSbN/lwul/r27Zv5TzILNW/eXKVLl9aYMWNu2j527typhx56SEWKFJHb7VZkZKS6du2qnTt33rR9Xo/UHwJcLpdeeeWVdNt07dpVLpdLefPmzeLeSevXr9fw4cOVkJCQ5ftOz1dffSUfHx/FxcVx7DLovffeU/369VW4cGG53W5FR0fr0Ucf1YEDBzK8jSNHjqhXr16Kjo5WQECASpUqpUGDBunEiRNe7Ro0aOD5P3G5XPL391d0dLR69eqlQ4cOZfIzA7KPX3Z3ADff4sWLdf/998vtduuRRx5RpUqVdP78ea1du1ZDhgzRzp079e67796UfZ89e1axsbF64YUXbtqXvqioKJ09e1a5cuW6Kdu34+fnpzNnzuirr77SAw884LVuzpw5yp07t86dO3dd2z58+LBGjBihEiVK6Pbbb8/w47799tvr2t/VHDt2TLNmzdKsWbPSrBs2bJhGjhypMmXK6IknnlBUVJROnDihr7/+Wh06dNCcOXPUpUsXnTx5UtWrV1diYqJ69OihmJgYnThxQtu2bdOUKVP05JNPpvmSs337ds2fP18dOnTI1OeTUzzxxBMaPHiwRowYoXz58mXqtufPn6/OnTsrNDRUPXv2VHR0tA4cOKDp06frs88+03/+8x/dd999mbrPG5U7d27NmzdPL774otfypKQkLVy4ULlz586Sfpw9e1Z+fv/787h+/XqNGDFC3bt3V0hISJb04VoWL16satWqKTw83PMlmGN3bT/99JOio6PVpk0b5c+fX/v379d7772nRYsWaevWrYqMjLzm40+fPq2aNWsqKSlJTz31lIoVK6atW7dq4sSJWrlypTZv3iwfn//9Llu0aFHPDwTnz5/Xzz//rKlTp2rp0qXatWuX8uTJc1OfL5AVKCL+4fbv369OnTopKipKK1asUEREhGddnz59tHfvXi1evPim7T91qMbN/OPhcrmy7A9ketxut2rXrq158+alKSLmzp2rVq1a6fPPP8+Svpw5c0Z58uSRv79/pm73o48+kp+fn1q3bu21/LPPPtPIkSPVsWNHzZ0716uQGzJkiJYuXaoLFy5IkqZPn66DBw9q3bp1qlWrltd2EhMT0/Q5ICBAxYoV08iRI9W+fXu5XK5MfU45QYcOHdSvXz99+umn6tGjR6Ztd9++fXr44YdVsmRJrVmzRoUKFfKs69+/v+rWrauHH35Y27ZtU8mSJTNtvzeqZcuWmj9/vrZu3aoqVap4li9cuFDnz59X8+bNtWLFipvejxv5PElJSdH58+dv6mfS119/neb1wrG7tsmTJ6dZ1q5dO1WvXl0ffvihnnvuuWs+/ssvv9Tvv/+uRYsWqVWrVp7loaGhGjlypLZu3aqqVat6lgcHB+uhhx7y2kZ0dLT69u2rdevW6Z577rnBZwRkP4Yz/cONHTtWp0+f1vTp070KiFSlS5dW//79PfcvXryoUaNGqVSpUnK73SpRooSef/55JScnez2uRIkSuvfee7V27Vrdddddyp07t0qWLKkPP/zQ02b48OGKioqSdPkLpcvl8oyfTW8sbepjrvyyuGzZMtWpU0chISHKmzevypUrp+eff96z/mpzIlasWKG6desqMDBQISEhatu2rXbt2pXu/vbu3ev5pSw4OFiPPvqozpw5c/UDe4UuXbrom2++8YrsN23apD179qhLly5p2p88eVKDBw9W5cqVlTdvXgUFBalFixbaunWrp82qVat05513SpIeffRRTzSe+jwbNGigSpUqafPmzapXr57y5MnjOS5Xzono1q2bcufOneb5N2vWTPnz59fhw4ev+fwWLFigGjVqpEkKXnrpJYWGhuqDDz5INwlq1qyZ7r33XkmXv9j6+vrq7rvvTtMuKCgozRcHHx8fvfjii9q2bZu++OKLa/bPiYSEBA0YMEDFihWT2+1W6dKl9frrryslJUWSdOHCBYWGhurRRx9N89jExETlzp1bgwcP9ixLTk7WsGHDVLp0abndbhUrVkzPPPNMmvdMesLCwnTbbbdp4cKFmfb8JOmNN97QmTNn9O6773oVEJJUsGBBTZs2TUlJSRo7dqxneep74ZdfftEDDzygoKAgFShQQP379083Sfvoo49UrVo1BQQEKDQ0VJ06dUozVCP1Nfrzzz+rYcOGypMnj4oUKeK1X6uaNWsqOjpac+fO9Vo+Z84cNW/eXKGhoek+7ptvvvG81/Ply6dWrVqlO2RrwYIFqlSpknLnzq1KlSpd9XVlHdc/fPhwDRkyRNLlL4Gp78PUBCB1aN2cOXNUsWJFud1uLVmyRNLlX79btGihoKAg5c2bV40bN9aGDRu89jVz5ky5XC6tW7dOgwYNUqFChRQYGKj77rsv3fky27dv16FDh7y+yHLsMnbsrpT6NygjQ60SExMlSYULF/Zanvp3NSAgwHYb4eHhkuSV1AC3NIN/tCJFipiSJUtmuH23bt2MJNOxY0czadIk88gjjxhJpl27dl7toqKiTLly5UzhwoXN888/byZOnGjuuOMO43K5zI4dO4wxxmzdutW89dZbRpLp3LmzmT17tvniiy88+4mKikqz/2HDhhnry3LHjh3G39/fVK9e3bzzzjtm6tSpZvDgwaZevXqeNvv37zeSzIwZMzzLli1bZvz8/EzZsmXN2LFjzYgRI0zBggVN/vz5zf79+9Psr2rVqqZ9+/Zm8uTJ5rHHHjOSzDPPPJOh4xUYGGgSExNN7ty5zfTp0z3rBgwYYGJiYjz9e+ONNzzrNm3aZEqVKmWee+45M23aNDNy5EhTpEgRExwcbP78809jjDFxcXFm5MiRRpLp1auXmT17tpk9e7bZt2+fMcaY+vXrm/DwcFOoUCHTr18/M23aNLNgwQLPuvr163v299dff5miRYuaO++801y8eNEYY8zUqVONJDN79uxrPsfz58+bgIAAM2jQIK/lv/76q5FkevToYXucjDFm9OjRRpKZOXOmbdvU43rx4kVTpkwZU6VKFZOSkuJZL8n06dPHdjtRUVGmW7dunvtJSUnmtttuMwUKFDDPP/+8mTp1qnnkkUeMy+Uy/fv397Tr0aOHCQkJMcnJyV7bmzVrlpFkNm3aZIwx5tKlS6Zp06YmT548ZsCAAWbatGmmb9++xs/Pz7Rt2/aafUn12GOPmYIFC9o+FyciIyNNiRIlrtmmRIkSpmjRop77qe+FypUrm9atW5uJEyeahx56yEgyDz/8sNdjX3nlFeNyucyDDz5oJk+e7Hl/lShRwvz111+edvXr1zeRkZGmWLFipn///mby5MmmUaNGRpL5+uuvPe2s75Hnn3/eFC9e3PP/fezYMePn52fmzZvneV1Yffjhh8blcpnmzZubCRMmmNdff92UKFHChISEeL3Xly5danx8fEylSpXMv//9b/PCCy+Y4OBgU7FixTSfRZLMsGHDjDGXP8c6d+5sJJm33nrL8z48ffq0p2358uVNoUKFzIgRI8ykSZPMTz/9ZHbs2GECAwNNRESEGTVqlHnttddMdHS0cbvdZsOGDZ59zZgxw/MZ1KhRIzNhwgTz9NNPG19fX/PAAw+k+X977bXXTFhYmOf4cOwyfuyMMeb48eMmPj7ebNq0ybRu3dpIMt9++226ba127txpfHx8TK1atUxsbKw5dOiQWbx4sSlatGiav4/169c3MTEx5tixY+bYsWPm8OHDZvny5aZixYqmdOnSaT5XgFsVRcQ/2KlTp4ykNF9mrmbLli1Gknnssce8lg8ePNhIMitWrPAsi4qKMpLMmjVrPMuOHj1q3G63efrppz3L0vsCbUzGi4jUIuTYsWNX7Xd6RcTtt99uwsLCzIkTJzzLtm7danx8fMwjjzySZn9XfhG+7777TIECBa66T+vzSP3D3LFjR9O4cWNjzOUvl+Hh4WbEiBHpHoNz586ZS5cupXkebrfbjBw50rNs06ZNaZ5bqvr16xtJZurUqemusxYRxlz+IiDJvPLKK+a3334zefPmTfPHLz179+41ksyECRO8li9cuNDz5SAj4uLiTKFChYwkExMTY3r37m3mzp1rEhIS0rS1HtfUL+7z58/3rL/eImLUqFEmMDDQ/Prrr17tnnvuOePr62sOHjxojPnfsfrqq6+82rVs2dKrKJ89e7bx8fEx3333nVe71AJt3bp1V+1LqtTiKj4+3vb5ZERCQkKG3vdt2rQxkkxiYqIx5n/vhTZt2ni1e+qpp4wks3XrVmOMMQcOHDC+vr7m1Vdf9Wq3fft24+fn57U89TX64YcfepYlJyeb8PBw06FDB88y63tkx44dRpLnmE6aNMnkzZvXJCUlpfki/Pfff5uQkBDz+OOPe/UlLi7OBAcHey2//fbbTUREhNfr7dtvvzWSrvlF2Bhj3njjDSPJ64u1ta2Pj4/ZuXOn1/J27doZf39/T9FvjDGHDx82+fLl8/oRJPWLcJMmTbwK5YEDBxpfX98074+6det6vY44dhk/dsYY43a7jSQjyRQoUMCMHz8+TZuref/9901ISIjn8ZJMt27dzIULF7zapb7ur7yVL1/e/PbbbxneH5DTMZzpHyw1fs3ohM2vv/5akjRo0CCv5U8//bQkpZk7UaFCBdWtW9dzv1ChQipXrpx+++236+7zlVLnUixcuNAz3MTOkSNHtGXLFnXv3t0rwr/tttt0zz33eJ6nVe/evb3u161bVydOnPAcw4zo0qWLVq1apbi4OK1YsUJxcXHpDmWSLs+jSJ2Ed+nSJZ04ccIzVOvHH3/M8D7dbne6w27S07RpUz3xxBOeOQa5c+fWtGnTbB+XeuaR/Pnzey13+voqXLiwtm7dqt69e+uvv/7S1KlT1aVLF4WFhWnUqFHpnoVJunxmmTJlymjkyJFXbZNRn376qerWrav8+fPr+PHjnluTJk106dIlrVmzRpLUqFEjFSxYUB9//LHnsX/99ZeWLVumBx980Gt75cuXV0xMjNf2GjVqJElauXKlbZ9Sj+vx48dv6Lml+vvvvyXZ/7+krr/yNd6nTx+v+/369ZP0v8+H+fPnKyUlRQ888IDXcw4PD1eZMmXSPOe8efN6jQ339/fXXXfdddXPiYoVK+q2227TvHnzJF2eV9S2bdt0J6IuW7ZMCQkJ6ty5s1dffH19VaNGDU9fUj8TunXrpuDgYM/j77nnHlWoUOGaxykj6tev77WdS5cu6dtvv1W7du285pxERESoS5cuWrt2bZrj3qtXL6+hnHXr1tWlS5f0+++/e5YlJCQoNjY2zVCmVBy7y9I7dqm++eYbff3113rzzTdVvHhxJSUlZbivRYoU0V133aW3335bX3zxhQYNGqQ5c+akO5+iRIkSWrZsmZYtW6ZvvvlGb7/9tk6dOqUWLVpwWmf8YzAw7x8sKChI0v++VNj5/fff5ePjo9KlS3stDw8PV0hISJoP5OLFi6fZRv78+fXXX39dZ4/TevDBB/X+++/rscce03PPPafGjRurffv26tixo9eZMK58HpJUrly5NOvKly+vpUuXKikpSYGBgZ7lVz6X1C92f/31l+c42mnZsqXy5cunjz/+WFu2bNGdd96p0qVLp3sKwZSUFL3zzjuaPHmy9u/fr0uXLnnWFShQIEP7ky7/UXMyiXrcuHFauHChtmzZorlz5yosLCzDj73yC7zT15d0+YvAlClTNHnyZO3Zs0dLly7V66+/rpdfflkRERF67LHH0jzG19dXL774orp166YFCxbc0BmF9uzZo23btqWZJ5Dq6NGjki6PWe7QoYPmzp2r5ORkud1uzZ8/XxcuXPAqIvbs2aNdu3bZbu9aUo/rtSaOnz17VqdOnfJaljq++kqpxYHd/8vVio0yZcp43S9VqpR8fHw8r+M9e/bIGJOmXaor58YULVo0zXPLnz+/tm3bdtW+denSRW+++aYGDhyo9evXe82BstqzZ48keYq2K6W+RlM/E9Lrs9PCPT3R0dFe948dO6YzZ85c9TMoJSVFhw4dUsWKFT3Lr/UZlGrp0qWSLv8gcDUcu/SPXaqGDRtKklq0aKG2bduqUqVKyps3r+fsgXFxcV7tg4ODFRAQoHXr1unee+/Vhg0bPKcpb9eunYKCgjRixAj16NHDqxgKDAxUkyZNPPebN2+uOnXqqHr16nrttdf05ptv2h8cIIejiPgHCwoKUmRkpHbs2OHocRk9C46vr2+6yzPya/HV9mH9Mi1dnqy2Zs0arVy5UosXL9aSJUv08ccfq1GjRvr222+v2genbuS5pHK73Wrfvr1mzZql33777ZoXXBo9erReeukl9ejRQ6NGjVJoaKh8fHw0YMCADCcuUsYm81n99NNPni+227dvV+fOnW0fk1rUXPkHOSYmxrMdp1wul8qWLauyZcuqVatWKlOmjObMmZNuESFdTiNGjRqlkSNHql27do73lyolJUX33HOPnnnmmXTXly1b1vPvTp06adq0afrmm2/Url07ffLJJ4qJifE6801KSooqV66sf//73+lur1ixYrZ9Sj2uBQsWvGqbjz/+OE3idLXXZnBwsCIiIq75JV2Stm3bpiJFitgWyVe+V1NSUuRyufTNN9+k+765cvL99by3OnfurKFDh+rxxx9XgQIFrvqlOfW9Mnv27HSLqqyawOr0fZiejBynr7/+WrVr1/ZKBK7Esfsfu8/vUqVKqWrVqpozZ46niLjyBCQzZsxQ9+7dNW3aNBUuXDjNdY7atGmj4cOHa/369bbJTLVq1RQcHOxJPIFbHUXEP9y9996rd999V7GxsapZs+Y120ZFRSklJUV79uxR+fLlPcvj4+OVkJDgOdNSZsifP3+6Z8RIL3728fFR48aN1bhxY/373//W6NGj9cILL2jlypVev/RYn4ck7d69O826X375RQULFvRKITJTly5d9MEHH8jHx0edOnW6arvPPvtMDRs21PTp072WJyQkeH2ZzMzTmiYlJenRRx9VhQoVVKtWLY0dO1b33Xef5wxQV1O8eHEFBARo//79XsvLli2rcuXKaeHChXrnnXeu+0JWJUuWVP78+XXkyJGrtklNI7p3735DZzIqVaqUTp8+ne7r5kr16tVTRESEPv74Y9WpU0crVqzQCy+8kGZ7W7duVePGja/7/2r//v0qWLDgVdMM6fJZrpYtW5bhbd5777167733tHbtWtWpUyfN+u+++04HDhzQE088kWbdnj17vH4d3rt3r1JSUjxnsilVqpSMMYqOjvYqujJT8eLFVbt2ba1atUpPPvnkVb/QlipVStLls1xd6/809TMh9dd3q/Q+J67k9P+2UKFCypMnz1U/g3x8fDJUYFoZY7RkyRKvM4Olh2PnzNmzZ73OpHbl+yw18YiPj0/zI5ckzymsL168mKH9Xbp0yevCmsCtjDkR/3DPPPOMAgMD9dhjjyk+Pj7N+n379umdd96RdHk4jiS9/fbbXm1Sf2W92jjc61GqVCmdOnXK69fSI0eOpDlt4MmTJ9M8NvWia1c7hWZERIRuv/12zZo1y6tQ2bFjh7799lvP87wZGjZsqFGjRmnixIlXHW4iXf5SfOWvZJ9++qn+/PNPr2WpxU5mXO312Wef1cGDBzVr1iz9+9//VokSJdStWzfbU5HmypVL1atX1w8//JBm3YgRI3TixAk99thj6f4R/fbbb7Vo0SJJ0vfff5/u+OONGzfqxIkT6Q5fsHrooYdUunRpjRgx4prtruWBBx5QbGysZ1iIVUJCgtdz8PHxUceOHfXVV19p9uzZunjxotdQptTt/fnnn3rvvffSbO/s2bMZGm+9efNm2wI/IiJCTZo08bpdy5AhQxQQEKAnnngizdV0T548qd69eytPnjye029aTZo0yev+hAkTJF0e/iFJ7du3l6+vr0aMGJHmNWyMSbO/6/XKK69o2LBhnjkZ6WnWrJmCgoI0evRoz5c5q9Sx59bPBOuwsGXLlunnn3+27YvT96Gvr6+aNm2qhQsXeg1njI+P19y5c1WnTp0MD5NMtWnTJh09ejRDn8McO28XL15Md2jTxo0btX37dq904cr3WWoyUbZsWcXHx2vVqlVe20idf2K9RsTVrFy5UqdPn/ZKM4FbGUnEP1ypUqU0d+5cPfjggypfvrzXFavXr1+vTz/9VN27d5ckValSRd26ddO7776rhIQE1a9fXxs3btSsWbPUrl07z1jSzNCpUyc9++yzuu+++/Svf/1LZ86c0ZQpU1S2bFmvMbYjR47UmjVr1KpVK0VFReno0aOaPHmyihYtmu4vrKneeOMNtWjRQjVr1lTPnj119uxZTZgwQcHBwdccZnSjUq9tYOfee+/VyJEj9eijj6pWrVravn275syZk+bCX6VKlVJISIimTp2qfPnyKTAwUDVq1EgzjtjOihUrNHnyZA0bNkx33HGHpMsxfYMGDfTSSy9d9bz9qdq2basXXnhBiYmJXn/AH3zwQW3fvl2vvvqqfvrpJ3Xu3NlzxeolS5Zo+fLlnvPWz549W3PmzNF9992natWqyd/fX7t27dIHH3yg3LlzX3XsdipfX1+98MILGZ5Inp4hQ4boyy+/1L333qvu3burWrVqSkpK0vbt2/XZZ5/pwIEDXknQgw8+qAkTJmjYsGGqXLmyV0InSQ8//LA++eQT9e7dWytXrlTt2rV16dIl/fLLL/rkk0+0dOnSNMMfrI4ePapt27almcx8o8qUKaNZs2apa9euqly5cporVh8/flzz5s3z/BpttX//frVp00bNmzdXbGysPvroI3Xp0sXzxadUqVJ65ZVXNHToUB04cEDt2rVTvnz5tH//fn3xxRfq1auX7a/lGVG/fn3Vr1//mm2CgoI0ZcoUPfzww7rjjjvUqVMnFSpUSAcPHtTixYtVu3ZtTZw4UZI0ZswYtWrVSnXq1FGPHj108uRJTZgwQRUrVrT9ZbhatWqSpBdeeEGdOnVSrly51Lp162smmq+88ornGjdPPfWU/Pz8NG3aNCUnJ9u+39KzePFilShRIkOTmTl23k6fPq1ixYrpwQcfVMWKFRUYGKjt27drxowZCg4O1ksvvWS7jb59+2rGjBlq3bq1+vXrp6ioKK1evVrz5s3TPffcoxo1ani1P3XqlD766CNJl4uY3bt3a8qUKQoICLC9sB1wy8j6E0IhO/z666/m8ccfNyVKlDD+/v4mX758pnbt2mbChAnm3LlznnYXLlwwI0aMMNHR0SZXrlymWLFiZujQoV5tjLl8uspWrVql2c+Vpxa92ilejbl8isBKlSoZf39/U65cOfPRRx+lOcXr8uXLTdu2bU1kZKTx9/c3kZGRpnPnzl6n6EzvFK/GGPPf//7X1K5d2wQEBJigoCDTunVr8/PPP3u1Sd3flaeQTT11YHqnJbRK79zrV7raKV6ffvppExERYQICAkzt2rVNbGxsuqdmXbhwoalQoYLx8/Pzep7169c3FStWTHef1u0kJiaaqKgoc8cdd6Q5FeHAgQONj4+PiY2NveZziI+PN35+fle9pkTq/1NYWJjx8/MzhQoVMq1btzYLFy70tNm2bZsZMmSIueOOO0xoaKjx8/MzERER5v777zc//vij1/audlwvXLhgSpUqdd2neDXm8qkthw4dakqXLm38/f1NwYIFTa1atcy4cePM+fPnvdqmpKSYYsWKeU6Nm57z58+b119/3VSsWNG43W6TP39+U61aNTNixAhz6tSpa/ZlypQpJk+ePJ7TrGa2bdu2mc6dO5uIiAiTK1cuEx4ebjp37my2b9+epm3qe+Hnn382HTt2NPny5TP58+c3ffv2NWfPnk3T/vPPPzd16tQxgYGBJjAw0MTExJg+ffqY3bt3e9pc7TV65Smer/U5ceXj0ntdrFy50jRr1swEBweb3Llzm1KlSpnu3bubH374IU2fy5cvb9xut6lQoYKZP39+uqeb1hWnKTXm8umBixQpYnx8fLw+G671Wvzxxx9Ns2bNTN68eU2ePHlMw4YNzfr1673apH7WpF57xPqcJJmVK1caY4ypXr26eeqpp9Lsg2Nnf+ySk5NN//79zW233WaCgoJMrly5TFRUlOnZs6ftZ7zVL7/8Yjp27GiKFSvm2cbgwYNNUlKSV7srT/HqcrlMaGioadOmjdm8eXOG9wfkdC5jbvCciQD+T+jZs6d+/fVXfffdd9ndlX+MqlWrqkGDBnrrrbeyuysaPny4RowYoWPHjl1zkjeyXnx8vCIiIrRo0aKbOhwTAJxgOBOADBk2bJjKli2rdevWqXbt2tndnVvekiVLPKe5Ba7l1KlTevnllzN1SCkA3CiKCAAZUrx4cZ07dy67u/GP0bx5c87SggwpW7bsTZ3LBQDXg7MzAQAAAHCEOREAAAAAHCGJAAAAAOAIRQQAAAAARygiAAAAADjyjzw707mL2d0DAMhcLSatz+4uAECmWtm/VnZ34aoCqvbNsn2d/Wlilu0rM5FEAAAAAHDkH5lEAAAAANfNxe/sdjhCAAAAABwhiQAAAACsXK7s7kGORxIBAAAAwBGSCAAAAMCKORG2OEIAAAAAHCGJAAAAAKyYE2GLJAIAAACAIyQRAAAAgBVzImxxhAAAAAA4QhIBAAAAWDEnwhZJBAAAAABHSCIAAAAAK+ZE2OIIAQAAAHCEIgIAAACAIwxnAgAAAKyYWG2LJAIAAACAIyQRAAAAgBUTq21xhAAAAAA4QhIBAAAAWDEnwhZJBAAAAABHSCIAAAAAK+ZE2OIIAQAAAHCEJAIAAACwYk6ELZIIAAAAAI6QRAAAAABWzImwxRECAAAA4AhJBAAAAGBFEmGLIwQAAADAEZIIAAAAwMqHszPZIYkAAAAA4AhJBAAAAGDFnAhbHCEAAAAAjlBEAAAAAHCE4UwAAACAlYuJ1XZIIgAAAAA4QhIBAAAAWDGx2hZHCAAAAIAjJBEAAACAFXMibJFEAAAAAHCEJAIAAACwYk6ELY4QAAAAAEdIIgAAAAAr5kTYIokAAAAA4AhJBAAAAGDFnAhbHCEAAAAAjpBEAAAAAFbMibBFEgEAAADAEZIIAAAAwIo5EbY4QgAAAAAcIYkAAAAArJgTYYskAgAAAIAjJBEAAACAFXMibHGEAAAAADhCEQEAAADAEYYzAQAAAFYMZ7LFEQIAAADgCEkEAAAAYMUpXm2RRAAAAABwhCQCAAAAsGJOhC2OEAAAAABHSCIAAAAAK+ZE2CKJAAAAAOAISQQAAABgxZwIWxwhAAAAAI6QRAAAAABWzImwRRIBAAAAwBGSCAAAAMDCRRJhiyQCAAAAgCMkEQAAAIAFSYQ9kggAAAAAjpBEAAAAAFYEEbZIIgAAAAA4QhEBAAAAwBGGMwEAAAAWTKy2RxIBAAAAwBGSCAAAAMCCJMIeSQQAAAAAR0giAAAAAAuSCHskEQAAAAAcIYkAAAAALEgi7JFEAAAAAHCEJAIAAACwIoiwRRIBAAAAwBGSCAAAAMCCORH2SCIAAACAW8CYMWN05513Kl++fAoLC1O7du20e/durzYNGjSQy+XyuvXu3durzcGDB9WqVSvlyZNHYWFhGjJkiC5evOioLyQRAAAAgEVOTSJWr16tPn366M4779TFixf1/PPPq2nTpvr5558VGBjoaff4449r5MiRnvt58uTx/PvSpUtq1aqVwsPDtX79eh05ckSPPPKIcuXKpdGjR2e4LxQRAAAAwC1gyZIlXvdnzpypsLAwbd68WfXq1fMsz5Mnj8LDw9Pdxrfffquff/5Z//3vf1W4cGHdfvvtGjVqlJ599lkNHz5c/v7+GeoLw5kAAAAAiyuHA93MW3JyshITE71uycnJGernqVOnJEmhoaFey+fMmaOCBQuqUqVKGjp0qM6cOeNZFxsbq8qVK6tw4cKeZc2aNVNiYqJ27tyZ4WNEEQEAAABkkzFjxig4ONjrNmbMGNvHpaSkaMCAAapdu7YqVarkWd6lSxd99NFHWrlypYYOHarZs2froYce8qyPi4vzKiAkee7HxcVluN8MZwIAAAAssnJOxNChQzVo0CCvZW632/Zxffr00Y4dO7R27Vqv5b169fL8u3LlyoqIiFDjxo21b98+lSpVKnM6LZIIAAAAINu43W4FBQV53eyKiL59+2rRokVauXKlihYtes22NWrUkCTt3btXkhQeHq74+HivNqn3rzaPIj0UEQAAAICVKwtvDhhj1LdvX33xxRdasWKFoqOjbR+zZcsWSVJERIQkqWbNmtq+fbuOHj3qabNs2TIFBQWpQoUKGe4Lw5kAAACAW0CfPn00d+5cLVy4UPny5fPMYQgODlZAQID27dunuXPnqmXLlipQoIC2bdumgQMHql69errtttskSU2bNlWFChX08MMPa+zYsYqLi9OLL76oPn36ZGgYVSqSCAAAAOAWMGXKFJ06dUoNGjRQRESE5/bxxx9Lkvz9/fXf//5XTZs2VUxMjJ5++ml16NBBX331lWcbvr6+WrRokXx9fVWzZk099NBDeuSRR7yuK5ERJBEAAACARU692Jwx5prrixUrptWrV9tuJyoqSl9//fUN9YUkAgAAAIAjJBEAAACARU5NInISkggAAAAAjpBEAAAAABYkEfZIIgAAAAA4QhIBAAAAWBFE2CKJAAAAAOAISQQAAABgwZwIeyQRAAAAABwhiQAAAAAsSCLskUQAAAAAcIQkAgAAALAgibBHEgEAAADAEZIIAAAAwIIkwh5JBAAAAABHSCIAAAAAK4IIWyQRAAAAAByhiAAAAADgCMOZAAAAAAsmVtsjiQAAAADgCEkEAAAAYEESYY8kAgAAAIAjJBEAAACABUmEPZIIAAAAAI6QRAAAAABWBBG2SCIAAAAAOEISAQAAAFgwJ8IeSQQAAAAAR0giAAAAAAuSCHskEQAAAAAcIYkAAAAALEgi7FFEADY2/7BJMz+Yrl0/79CxY8f01vhJatS4iWf9S88/py8XfuH1mFq162jKu9OzuqsAkK7bIoP0YLVIlQ3Lq4J5/fXiV79o3W8nPevz58mlXrWjVL14iPK6fbXtz0SNX71ffyacS3d7r7Utrxol8qfZDoD/OygiABtnz55RuXLl1K59Bw3q3zfdNrXr1NXIV8Z47vv7+2dV9wDAVu5cPtp3PEnf/HxUo+6NSbN+1L0xupiSohcX/aIzyRd1/x2RGndfRT06+yedu5ji1bZj1QiZrOo4kE1IIuxRRAA26tStrzp161+zjb+/vwoWKpRFPQIAZzb+nqCNvyeku65oSG5VjMinR2f/pAMnz0qS3lrxmz5//E41KldQX+886mlbqmAePVA1Uk/8Z5vmP35nVnQdQA6VrUXE8ePH9cEHHyg2NlZxcXGSpPDwcNWqVUvdu3dXIb6U4Rbxw6aNalC3poKCgnRXjbvV918DFBKSP7u7BQC2cvlePsfK+Uv/SxyMpAuXUlQ5MshTRLj9fPRi87J6Z9Vv+uvMhezoKpB1CCJsZdvZmTZt2qSyZctq/PjxCg4OVr169VSvXj0FBwdr/PjxiomJ0Q8//GC7neTkZCUmJnrdkpOTs+AZAJfVqlNXr4x+Xe9Nn6kBg4Zo86ZNeuqJx3Xp0qXs7hoA2Dr411nFJSbr8VpRyuv2lZ+PS52qFVFYPrcKBObytOtTr4R2Hvlb6377Kxt7CyCnyLYkol+/frr//vs1derUNOPOjDHq3bu3+vXrp9jY2GtuZ8yYMRoxYoTXshdeGqYXXx6e2V0G0tWiZSvPv8uULaeyZcupVfMm+mHTRtW4u2Y29gwA7F1KMRq2+BcNaVJaX/WuoUspRpsPJmjDgb88P8bWis6vqsWC9fjcrdnaVyCrMCfCXrYVEVu3btXMmTPT/U9yuVwaOHCgqlatarudoUOHatCgQV7LjK870/oJOFW0WDHlz59fBw/+ThEB4Jbw69EkPT53qwL9feXn69Kpsxc1+cHK2h1/WpJUtViwIoNza1HvGl6PG9GqnLYfTtTAz3dmR7cBZKNsKyLCw8O1ceNGxcSkPUuEJG3cuFGFCxe23Y7b7Zbb7V00nLuYKV0Erkt8XJwSEhJUqCBzegDcWpLOXx6GWSQkt8qG5dUHsQclSXN/+FOLLROsJWnGQ7dr8pr9Wr+f4U3A/0XZVkQMHjxYvXr10ubNm9W4cWNPwRAfH6/ly5frvffe07hx47Kre4DHmaQkHTx40HP/zz/+0C+7dik4OFjBwcGaOmWimtzTTAUKFtQfhw7prTffULHiUapVp2429hoA/id3Lh8VCc7tuR8R7Fapgnn0d/JFHf37vOqXLqCEsxd09O9klSyYR33rR2vdbyf1w8FTkqS/zlxIdzJ1/N/nFZfIPET88zCcyV62FRF9+vRRwYIF9dZbb2ny5MmeSai+vr6qVq2aZs6cqQceeCC7ugd47Ny5Q489+ojn/rixl68H0abtfXrh5eH6dfev+nLhAv2d+LfCwsJUs1Zt9enXn2tFAMgxyoXl1dsdK3nu96kXLUla8vNRvb5srwoE5tJT9Uoof55cOpF0Qd/uOqrZG//Iru4CuAW4jDHZfs2YCxcu6Pjx45KkggULKleuXDaPuDaGMwH4p2kxaX12dwEAMtXK/rWyuwtXVXrwN1m2r73jWmTZvjJTjrjYXK5cuRQREZHd3QAAAACQATmiiAAAAAByCuZE2Mu2i80BAAAAuDWRRAAAAAAWBBH2SCIAAAAAOEISAQAAAFgwJ8IeSQQAAAAAR0giAAAAAAuCCHskEQAAAAAcIYkAAAAALHx8iCLskEQAAAAAcIQkAgAAALBgToQ9kggAAAAAjpBEAAAAABZcJ8IeSQQAAAAARygiAAAAADjCcCYAAADAgtFM9kgiAAAAADhCEgEAAABYMLHaHkkEAAAAAEdIIgAAAAALkgh7JBEAAAAAHCGJAAAAACwIIuyRRAAAAABwhCQCAAAAsGBOhD2SCAAAAACOkEQAAAAAFgQR9kgiAAAAADhCEgEAAABYMCfCHkkEAAAAAEdIIgAAAAALggh7JBEAAAAAHCGJAAAAACyYE2GPJAIAAACAIyQRAAAAgAVBhD2SCAAAAACOUEQAAAAAcIThTAAAAIAFE6vtkUQAAAAAcIQkAgAAALAgiLBHEgEAAADAEZIIAAAAwII5EfZIIgAAAIBbwJgxY3TnnXcqX758CgsLU7t27bR7926vNufOnVOfPn1UoEAB5c2bVx06dFB8fLxXm4MHD6pVq1bKkyePwsLCNGTIEF28eNFRXygiAAAAAAuXK+tuTqxevVp9+vTRhg0btGzZMl24cEFNmzZVUlKSp83AgQP11Vdf6dNPP9Xq1at1+PBhtW/f3rP+0qVLatWqlc6fP6/169dr1qxZmjlzpl5++WVnx8gYY5x1P+c756yQAoAcr8Wk9dndBQDIVCv718ruLlxVrbFrsmxf65+pd92PPXbsmMLCwrR69WrVq1dPp06dUqFChTR37lx17NhRkvTLL7+ofPnyio2N1d13361vvvlG9957rw4fPqzChQtLkqZOnapnn31Wx44dk7+/f4b2TRIBAAAAWLhcriy7JScnKzEx0euWnJycoX6eOnVKkhQaGipJ2rx5sy5cuKAmTZp42sTExKh48eKKjY2VJMXGxqpy5cqeAkKSmjVrpsTERO3cuTPDx4giAgAAAMgmY8aMUXBwsNdtzJgxto9LSUnRgAEDVLt2bVWqVEmSFBcXJ39/f4WEhHi1LVy4sOLi4jxtrAVE6vrUdRnF2ZkAAAAAi6w8OdPQoUM1aNAgr2Vut9v2cX369NGOHTu0du3am9W1a6KIAAAAALKJ2+3OUNFg1bdvXy1atEhr1qxR0aJFPcvDw8N1/vx5JSQkeKUR8fHxCg8P97TZuHGj1/ZSz96U2iYjGM4EAAAAWGTlnAgnjDHq27evvvjiC61YsULR0dFe66tVq6ZcuXJp+fLlnmW7d+/WwYMHVbNmTUlSzZo1tX37dh09etTTZtmyZQoKClKFChUy3BeSCAAAAOAW0KdPH82dO1cLFy5Uvnz5PHMYgoODFRAQoODgYPXs2VODBg1SaGiogoKC1K9fP9WsWVN33323JKlp06aqUKGCHn74YY0dO1ZxcXF68cUX1adPH0eJCEUEAAAAYJFTr1g9ZcoUSVKDBg28ls+YMUPdu3eXJL311lvy8fFRhw4dlJycrGbNmmny5Mmetr6+vlq0aJGefPJJ1axZU4GBgerWrZtGjhzpqC9cJwIAbgFcJwLAP01Ovk5EvX+vy7J9rRlUO8v2lZlIIgAAAACLHBpE5ChMrAYAAADgCEUEAAAAAEcYzgQAAABY5NSJ1TkJSQQAAAAAR0giAAAAAAuCCHskEQAAAAAcIYkAAAAALJgTYY8kAgAAAIAjJBEAAACABUGEPZIIAAAAAI6QRAAAAAAWPkQRtkgiAAAAADhCEgEAAABYEETYI4kAAAAA4AhJBAAAAGDBdSLskUQAAAAAcIQkAgAAALDwIYiwRRIBAAAAwBGSCAAAAMCCORH2SCIAAAAAOEISAQAAAFgQRNgjiQAAAADgCEUEAAAAAEcYzgQAAABYuMR4JjskEQAAAAAcIYkAAAAALLjYnD2SCAAAAACOkEQAAAAAFlxszh5JBAAAAABHSCIAAAAAC4IIeyQRAAAAABwhiQAAAAAsfIgibJFEAAAAAHCEJAIAAACwIIiwRxIBAAAAwBGSCAAAAMCC60TYI4kAAAAA4AhJBAAAAGBBEGGPJAIAAACAIyQRAAAAgAXXibBHEgEAAADAEYoIAAAAAI4wnAkAAACwYDCTPZIIAAAAAI6QRAAAAAAWXGzOHkkEAAAAAEdIIgAAAAALH4IIWyQRAAAAABwhiQAAAAAsmBNhjyQCAAAAgCMkEQAAAIAFQYQ9kggAAAAAjpBEAAAAABbMibBHEgEAAADAEZIIAAAAwILrRNgjiQAAAADgCEkEAAAAYMGcCHsZKiK+/PLLDG+wTZs2190ZAAAAADlfhoqIdu3aZWhjLpdLly5dupH+AAAAANmKHMJehoqIlJSUm90PAAAAALcI5kQAAAAAFj7MibB1XUVEUlKSVq9erYMHD+r8+fNe6/71r39lSscAAAAA5EyOi4iffvpJLVu21JkzZ5SUlKTQ0FAdP35cefLkUVhYGEUEAAAA8A/n+DoRAwcOVOvWrfXXX38pICBAGzZs0O+//65q1app3LhxN6OPAAAAQJZxubLudqtyXERs2bJFTz/9tHx8fOTr66vk5GQVK1ZMY8eO1fPPP38z+ggAAAAgB3FcROTKlUs+PpcfFhYWpoMHD0qSgoODdejQocztHQAAAJDFXC5Xlt1uVY7nRFStWlWbNm1SmTJlVL9+fb388ss6fvy4Zs+erUqVKt2MPgIAAADIQRwnEaNHj1ZERIQk6dVXX1X+/Pn15JNP6tixY3r33XczvYMAAABAVmJOhD3HSUT16tU9/w4LC9OSJUsytUMAAAAAcjYuNgcAAABYcLE5e46LiOjo6GtOAvntt99uqEMAAAAAcjbHRcSAAQO87l+4cEE//fSTlixZoiFDhmRWvwAAAIBsQRBhz3ER0b9//3SXT5o0ST/88MMNdwgAAABAzub47ExX06JFC33++eeZtTkAAAAgW3CdCHuZVkR89tlnCg0NzazNAQAAAMihrutic9aqyRijuLg4HTt2TJMnT87Uzl2vvXGns7sLAJCpNsycm91dAIDM1b9WdvfgqjLtV/Z/MMdFRNu2bb2KCB8fHxUqVEgNGjRQTExMpnYOAAAAQM7juIgYPnz4TegGAAAAkDPcynMVsorjtMbX11dHjx5Ns/zEiRPy9fXNlE4BAAAAyLkcJxHGmHSXJycny9/f/4Y7BAAAAGQnH4IIWxkuIsaPHy/pcrzz/vvvK2/evJ51ly5d0po1a5gTAQAAAPwfkOEi4q233pJ0OYmYOnWq19Alf39/lShRQlOnTs38HgIAAADIUTJcROzfv1+S1LBhQ82fP1/58+e/aZ0CAAAAsgvDmew5nhOxcuXKm9EPAAAAALcIx2dn6tChg15//fU0y8eOHav7778/UzoFAAAAZBeXy5VlNyfWrFmj1q1bKzIyUi6XSwsWLPBa37179zTbb968uVebkydPqmvXrgoKClJISIh69uyp06edX6jZcRGxZs0atWzZMs3yFi1aaM2aNY47AAAAAMBeUlKSqlSpokmTJl21TfPmzXXkyBHPbd68eV7ru3btqp07d2rZsmVatGiR1qxZo169ejnui+PhTKdPn073VK65cuVSYmKi4w4AAAAAOUlOnRPRokULtWjR4ppt3G63wsPD0123a9cuLVmyRJs2bVL16tUlSRMmTFDLli01btw4RUZGZrgvjpOIypUr6+OPP06z/D//+Y8qVKjgdHMAAADA/1nJyclKTEz0uiUnJ1/39latWqWwsDCVK1dOTz75pE6cOOFZFxsbq5CQEE8BIUlNmjSRj4+Pvv/+e0f7cZxEvPTSS2rfvr327dunRo0aSZKWL1+uuXPn6rPPPnO6OQAAACBHcThV4YaMGTNGI0aM8Fo2bNgwDR8+3PG2mjdvrvbt2ys6Olr79u3T888/rxYtWig2Nla+vr6Ki4tTWFiY12P8/PwUGhqquLg4R/tyXES0bt1aCxYs0OjRo/XZZ58pICBAVapU0YoVKxQaGup0cwAAAMD/WUOHDtWgQYO8lrnd7uvaVqdOnTz/rly5sm677TaVKlVKq1atUuPGjW+on1dyXERIUqtWrdSqVStJUmJioubNm6fBgwdr8+bNunTpUqZ2EAAAAMhKPlkYRbjd7usuGuyULFlSBQsW1N69e9W4cWOFh4fr6NGjXm0uXryokydPXnUexdU4nhORas2aNerWrZsiIyP15ptvqlGjRtqwYcP1bg4AAABAJvrjjz904sQJRURESJJq1qyphIQEbd682dNmxYoVSklJUY0aNRxt21ESERcXp5kzZ2r69OlKTEzUAw88oOTkZC1YsIBJ1QAAAPhHuO5f2W+y06dPa+/evZ77+/fv15YtWxQaGqrQ0FCNGDFCHTp0UHh4uPbt26dnnnlGpUuXVrNmzSRJ5cuXV/PmzfX4449r6tSpunDhgvr27atOnTo5OjOT5OAYtW7dWuXKldO2bdv09ttv6/Dhw5owYYKjnQEAAAC4Pj/88IOqVq2qqlWrSpIGDRqkqlWr6uWXX5avr6+2bdumNm3aqGzZsurZs6eqVaum7777zmu41Jw5cxQTE6PGjRurZcuWqlOnjt59913HfclwEvHNN9/oX//6l5588kmVKVPG8Y4AAACAW0FWnp3JiQYNGsgYc9X1S5cutd1GaGio5s6de8N9yXASsXbtWv3999+qVq2aatSooYkTJ+r48eM33AEAAAAAt5YMFxF333233nvvPR05ckRPPPGE/vOf/ygyMlIpKSlatmyZ/v7775vZTwAAACBL+LhcWXa7VTmeNxIYGKgePXpo7dq12r59u55++mm99tprCgsLU5s2bW5GHwEAAADkIDc0+bxcuXIaO3as/vjjD82bNy+z+gQAAABkG5cr6263qkw5g5Wvr6/atWunL7/8MjM2BwAAACAHu64rVgMAAAD/VD63cEKQVXLqtTQAAAAA5FAUEQAAAAAcYTgTAAAAYHErn3o1q5BEAAAAAHCEJAIAAACwIIiwRxIBAAAAwBGSCAAAAMCCU7zaI4kAAAAA4AhJBAAAAGDhElGEHZIIAAAAAI6QRAAAAAAWzImwRxIBAAAAwBGSCAAAAMCCJMIeSQQAAAAAR0giAAAAAAsXl6y2RRIBAAAAwBGSCAAAAMCCORH2SCIAAAAAOEISAQAAAFgwJcIeSQQAAAAARygiAAAAADjCcCYAAADAwofxTLZIIgAAAAA4QhIBAAAAWHCKV3skEQAAAAAcIYkAAAAALJgSYY8kAgAAAIAjJBEAAACAhY+IIuyQRAAAAABwhCQCAAAAsGBOhD2SCAAAAACOkEQAAAAAFlwnwh5JBAAAAABHSCIAAAAACx8mRdgiiQAAAADgCEkEAAAAYEEQYY8kAgAAAIAjJBEAAACABXMi7JFEAAAAAHCEJAIAAACwIIiwRxIBAAAAwBGKCAAAAACOMJwJAAAAsOBXdnscIwAAAACOkEQAAAAAFi5mVtsiiQAAAADgCEkEAAAAYEEOYY8kAgAAAIAjJBEAAACAhQ9zImyRRAAAAABwhCQCAAAAsCCHsEcSAQAAAMARkggAAADAgikR9kgiAAAAADhCEgEAAABYcMVqeyQRAAAAABwhiQAAAAAs+JXdHscIAAAAgCMkEQAAAIAFcyLskUQAAAAAcIQiAgAAAIAjDGcCAAAALBjMZI8kAgAAAIAjJBEAAACABROr7ZFEAAAAAHCEJAIAAACw4Fd2exwjAAAAAI6QRAAAAAAWzImwRxIBAAAAwBGSCAAAAMCCHMIeSQQAAAAAR0giAAAAAAumRNgjiQAAAADgCEkEAAAAYOHDrAhbJBEAAAAAHCGJAAAAACyYE2GPJAIAAACAIyQRAAAAgIWLORG2SCIAAACAW8CaNWvUunVrRUZGyuVyacGCBV7rjTF6+eWXFRERoYCAADVp0kR79uzxanPy5El17dpVQUFBCgkJUc+ePXX69GnHfaGIAAAAACxcrqy7OZGUlKQqVapo0qRJ6a4fO3asxo8fr6lTp+r7779XYGCgmjVrpnPnznnadO3aVTt37tSyZcu0aNEirVmzRr169XJ8jBjOBAAAANwCWrRooRYtWqS7zhijt99+Wy+++KLatm0rSfrwww9VuHBhLViwQJ06ddKuXbu0ZMkSbdq0SdWrV5ckTZgwQS1bttS4ceMUGRmZ4b6QRAAAAADZJDk5WYmJiV635ORkx9vZv3+/4uLi1KRJE8+y4OBg1ahRQ7GxsZKk2NhYhYSEeAoISWrSpIl8fHz0/fffO9ofRQQAAABg4SNXlt3GjBmj4OBgr9uYMWMc9zkuLk6SVLhwYa/lhQsX9qyLi4tTWFiY13o/Pz+FhoZ62mQUw5kAAACAbDJ06FANGjTIa5nb7c6m3mQcRQQAAABgkZUXm3O73ZlSNISHh0uS4uPjFRER4VkeHx+v22+/3dPm6NGjXo+7ePGiTp486Xl8RjGcCQAAALjFRUdHKzw8XMuXL/csS0xM1Pfff6+aNWtKkmrWrKmEhARt3rzZ02bFihVKSUlRjRo1HO2PJAIAAACwyMokwonTp09r7969nvv79+/Xli1bFBoaquLFi2vAgAF65ZVXVKZMGUVHR+ull15SZGSk2rVrJ0kqX768mjdvrscff1xTp07VhQsX1LdvX3Xq1MnRmZkkiggAAADglvDDDz+oYcOGnvupcym6deummTNn6plnnlFSUpJ69eqlhIQE1alTR0uWLFHu3Lk9j5kzZ4769u2rxo0by8fHRx06dND48eMd98VljDE3/pRylh1/OL/qHgDkZHe2fi67uwAAmersTxOzuwtXtWzX8Szb1z3lC2bZvjITcyIAAAAAOMJwJgAAAMDCJ4fOichJSCIAAAAAOEISAQAAAFi4RBRhhyQCAAAAgCMkEQAAAIBFTr1ORE5CEgEAAADAEZIIAAAAwII5EfZIIgAAAAA4QhIBAAAAWHCdCHskEQAAAAAcoYgAAAAA4AjDmQAAAAALJlbbI4kAAAAA4AhJBAAAAGDBxebsUUQANk4cO6qP3huvHzeu1/nkcwovUlR9hgxX6XIVJEkdGldL93EP9+qvdg8+kpVdBYA0BvdoqnaNqqhsicI6m3xB32/9TS+8s1B7fj/qaRNdtKBeG3ifalYtKXcuPy1bv0uDXv9UR0/+7WlTuniYRg9sp5pVSso/l6927DmsEZMXac0Pe7LjaQHIZhQRwDWc/jtRL/TvoUq3V9eLr41XUHB+HfnzoPLmy+dp8/6nS70e89PG9Zo8bqTurtsoq7sLAGnUvaO0pn68Rpt3/i4/P1+N6Ntai6b0VdX2r+jMufPKk9tfiyb30fZf/1SLXhMkScOeaqXP33lC9R55U8YYSdL88b219+BRtXhivM4mX1DfLg01f3xvVWw9XPEn/r5WF4BbDkGEPYoI4Bq++M9MFSxUWH2fGe5ZVjiiiFeb/KEFve5vXLdKlW6vrvDIolnRRQC4prZ9J3vd7zXsIx1a8ZqqViimdT/uU83bSyoqsoDu7vy6/k46J0l67OXZOrJ6rBrcVVYrv9+tAiGBKhMVpidHzNGOPYclSS+NX6jeD9ZThdKRij+xO8ufF4DsxcRq4Bp+WL9GpcpV0LgRz+jRDk00+IkuWrZ4/lXbJ5w8oR+/X6vGLdpmYS8BIOOC8uaWJP116owkye3vJ2OMks9f9LQ5l3xRKSlGtW4vJUk6kZCk3fvj1OXeu5Qnt798fX30WIc6ij+RqJ9+Ppj1TwK4yXxcriy73apydBFx6NAh9ejR45ptkpOTlZiY6HU7n5ycRT3EP138kT+19MvPFFGkuF56baKatu6oDyaO08qlX6XbftW3ixSQJ1A1GMoEIAdyuVx6Y3BHrf9pn37ed0SStHH7ASWdPa9X+7dVQO5cypPbX68Nuk9+fr4KLxjkeWyr3hNVJaaYjq0bp4QNb+lfDzdS2z6TlfD32ex6OgCyUY4uIk6ePKlZs2Zds82YMWMUHBzsdXt/0ptZ1EP80xmTopJlYtT1sb4qWSZGTe9tryat2unbrz5Pt/3yJQtVt3EL+fu7s7inAGDv7aEPqGLpCD3y3AzPsuN/nVbXZ6arZb1KOr7uTcV/94aC8wbox58PKuX/z4eQpLeGPqBjJ/9Wkx5vq+7Db+jLlVv1+TtPeBUawD+FKwtvt6psnRPx5ZdfXnP9b7/9ZruNoUOHatCgQV7L9h67cEP9AlKFhBZU0ahor2VFikdrw5oVadr+vO0nHT70u55+6bWs6h4AZNhbz96vlnUrqUnPt/Xn0QSvdcs3/KKKbUaoQEigLl5M0anTZ7V/2WgdWLpZktTgrrJqWbeSIuo/45k3MWDMJ2p8d4weal1D42Ysy+qnAyCbZWsR0a5dO7lcLs+ZH9Ljshkr5na75XZ7/+rrn3g6U/oHxFSqosOHfvdaduSPgypUOCJN2+XfLFCpsuVVolTZrOoeAGTIW8/erzaNqqjp4+/o98MnrtruREKSJKn+nWUVFppXi1ZvlyTlye0vSUpJSfFqn5JibP9OA7ckXta2snU4U0REhObPn6+UlJR0bz/++GN2dg9Q6w5d9euu7fp8zgc68uchfbf8Gy1bPF/N297v1e5M0mnFrvmvGrdslz0dBYCreHvoA+rU6k51e36mTiedU+EC+VS4QD7ldufytHm4zd26q3IJRRctqE4t79ScsT01Yc5Kz7Ukvt+2X38lntH7ox5R5bJFLl8zYkA7lShSQEvW7syupwYgG2VrElGtWjVt3rxZbdumfyYbu5QCuNlKx1TUMyPGac70ifp09nsKi4jUo089rXpNWnq1W7vyWxljVKdhs2zqKQCk74kH6kmSlr0/wGv54y/P1kdffS9JKlsiTCP7tVFocB79fvikxk5fqvEf/W/Y5omEJLXtO1nD+7TWN9P+pVx+Ptr1W5zuH/iutv/6Z5Y9FyCruIgibLlMNn5L/+6775SUlKTmzZunuz4pKUk//PCD6tev72i7O/5gOBOAf5Y7Wz+X3V0AgEx19qeJ2d2Fq/p+36ks21eNUsFZtq/MlK1JRN26da+5PjAw0HEBAQAAANwIpvrYy9GneAUAAACQ82RrEgEAAADkNAQR9kgiAAAAADhCEgEAAABYEUXYIokAAAAA4AhFBAAAAABHGM4EAAAAWHCxOXskEQAAAAAcIYkAAAAALLjYnD2SCAAAAACOkEQAAAAAFgQR9kgiAAAAADhCEgEAAABYEUXYIokAAAAA4AhJBAAAAGDBdSLskUQAAAAAcIQkAgAAALDgOhH2SCIAAAAAOEISAQAAAFgQRNgjiQAAAADgCEkEAAAAYEUUYYskAgAAAIAjJBEAAACABdeJsEcSAQAAAMARiggAAAAAjjCcCQAAALDgYnP2SCIAAAAAOEISAQAAAFgQRNgjiQAAAADgCEkEAAAAYEUUYYskAgAAAIAjJBEAAACABRebs0cSAQAAAMARkggAAADAgutE2COJAAAAAOAISQQAAABgQRBhjyQCAAAAgCMkEQAAAIAVUYQtkggAAAAAjpBEAAAAABZcJ8IeSQQAAAAAR0giAAAAAAuuE2GPJAIAAACAIxQRAAAAABxhOBMAAABgwWgmeyQRAAAAABwhiQAAAACsiCJskUQAAAAAcIQkAgAAALDgYnP2SCIAAAAAOEISAQAAAFhwsTl7JBEAAAAAHCGJAAAAACwIIuyRRAAAAABwhCQCAAAAsCKKsEUSAQAAAMARkggAAADAgutE2COJAAAAAG4Bw4cPl8vl8rrFxMR41p87d059+vRRgQIFlDdvXnXo0EHx8fE3pS8UEQAAAICFy5V1N6cqVqyoI0eOeG5r1671rBs4cKC++uorffrpp1q9erUOHz6s9u3bZ+KR+R+GMwEAAAC3CD8/P4WHh6dZfurUKU2fPl1z585Vo0aNJEkzZsxQ+fLltWHDBt19992Z2g+SCAAAAMDClYW35ORkJSYmet2Sk5Ov2rc9e/YoMjJSJUuWVNeuXXXw4EFJ0ubNm3XhwgU1adLE0zYmJkbFixdXbGxs5hwYC4oIAAAAIJuMGTNGwcHBXrcxY8ak27ZGjRqaOXOmlixZoilTpmj//v2qW7eu/v77b8XFxcnf318hISFejylcuLDi4uIyvd8MZwIAAACssvDkTEOHDtWgQYO8lrnd7nTbtmjRwvPv2267TTVq1FBUVJQ++eQTBQQE3NR+XokkAgAAAMgmbrdbQUFBXrerFRFXCgkJUdmyZbV3716Fh4fr/PnzSkhI8GoTHx+f7hyKG0URAQAAANyCTp8+rX379ikiIkLVqlVTrly5tHz5cs/63bt36+DBg6pZs2am75vhTAAAAIBFTr3Y3ODBg9W6dWtFRUXp8OHDGjZsmHx9fdW5c2cFBwerZ8+eGjRokEJDQxUUFKR+/fqpZs2amX5mJokiAgAAALgl/PHHH+rcubNOnDihQoUKqU6dOtqwYYMKFSokSXrrrbfk4+OjDh06KDk5Wc2aNdPkyZNvSl9cxhhzU7acjXb8cTq7uwAAmerO1s9ldxcAIFOd/Wlidnfhqg6evPopVjNb8dCMzX/IaZgTAQAAAMARhjMBAAAAFjlzRkTOQhIBAAAAwBGSCAAAAMDCRRRhiyQCAAAAgCMkEQAAAIAXogg7JBEAAAAAHCGJAAAAACyYE2GPJAIAAACAIyQRAAAAgAVBhD2SCAAAAACOkEQAAAAAFsyJsEcSAQAAAMARkggAAADAwsWsCFskEQAAAAAcoYgAAAAA4AjDmQAAAAArRjPZIokAAAAA4AhJBAAAAGBBEGGPJAIAAACAIyQRAAAAgAUXm7NHEgEAAADAEZIIAAAAwIKLzdkjiQAAAADgCEkEAAAAYEUQYYskAgAAAIAjJBEAAACABUGEPZIIAAAAAI6QRAAAAAAWXCfCHkkEAAAAAEdIIgAAAAALrhNhjyQCAAAAgCMkEQAAAIAFcyLskUQAAAAAcIQiAgAAAIAjFBEAAAAAHKGIAAAAAOAIE6sBAAAACyZW2yOJAAAAAOAISQQAAABgwcXm7JFEAAAAAHCEJAIAAACwYE6EPZIIAAAAAI6QRAAAAAAWBBH2SCIAAAAAOEISAQAAAFgRRdgiiQAAAADgCEkEAAAAYMF1IuyRRAAAAABwhCQCAAAAsOA6EfZIIgAAAAA4QhIBAAAAWBBE2COJAAAAAOAISQQAAABgRRRhiyQCAAAAgCMUEQAAAAAcYTgTAAAAYMHF5uyRRAAAAABwhCQCAAAAsOBic/ZIIgAAAAA44jLGmOzuBHArSk5O1pgxYzR06FC53e7s7g4A3DA+1wBkFEUEcJ0SExMVHBysU6dOKSgoKLu7AwA3jM81ABnFcCYAAAAAjlBEAAAAAHCEIgIAAACAIxQRwHVyu90aNmwYkw8B/GPwuQYgo5hYDQAAAMARkggAAAAAjlBEAAAAAHCEIgIAAACAIxQRAAAAAByhiACu06RJk1SiRAnlzp1bNWrU0MaNG7O7SwBwXdasWaPWrVsrMjJSLpdLCxYsyO4uAcjhKCKA6/Dxxx9r0KBBGjZsmH788UdVqVJFzZo109GjR7O7awDgWFJSkqpUqaJJkyZld1cA3CI4xStwHWrUqKE777xTEydOlCSlpKSoWLFi6tevn5577rls7h0AXD+Xy6UvvvhC7dq1y+6uAMjBSCIAh86fP6/NmzerSZMmnmU+Pj5q0qSJYmNjs7FnAAAAWYMiAnDo+PHjunTpkgoXLuy1vHDhwoqLi8umXgEAAGQdiggAAAAAjlBEAA4VLFhQvr6+io+P91oeHx+v8PDwbOoVAABA1qGIABzy9/dXtWrVtHz5cs+ylJQULV++XDVr1szGngEAAGQNv+zuAHArGjRokLp166bq1avrrrvu0ttvv62kpCQ9+uij2d01AHDs9OnT2rt3r+f+/v37tWXLFoWGhqp48eLZ2DMAORWneAWu08SJE/XGG28oLi5Ot99+u8aPH68aNWpkd7cAwLFVq1apYcOGaZZ369ZNM2fOzPoOAcjxKCIAAAAAOMKcCAAAAACOUEQAAAAAcIQiAgAAAIAjFBEAAAAAHKGIAAAAAOAIRQQAAAAARygiAAAAADhCEQEAAADAEYoIAMhhunfvrnbt2nnuN2jQQAMGDMjyfqxatUoul0sJCQlZvm8AQM5GEQEAGdS9e3e5XC65XC75+/urdOnSGjlypC5evHhT9zt//nyNGjUqQ2354g8AyAp+2d0BALiVNG/eXDNmzFBycrK+/vpr9enTR7ly5dLQoUO92p0/f17+/v6Zss/Q0NBM2Q4AAJmFJAIAHHC73QoPD1dUVJSefPJJNWnSRF9++aVnCNKrr76qyMhIlStXTpJ06NAhPfDAAwoJCVFoaKjatm2rAwcOeLZ36dIlDRo0SCEhISpQoICeeeYZGWO89nnlcKbk5GQ9++yzKlasmNxut0qXLq3p06frwIEDatiwoSQpf/78crlc6t69uyQpJSVFY8aMUXR0tAICAlSlShV99tlnXvv5+uuvVbZsWQUEBKhhw4Ze/QQAwIoiAgBuQEBAgM6fPy9JWr58uXbv3q1ly5Zp0aJFunDhgpo1a6Z8+fLpu+++07p165Q3b141b97c85g333xTM2fO1AcffKC1a9fq5MmT+uKLL665z0ceeUTz5s3T+PHjtWvXLk2bNk158+ZVsWLF9Pnnn0uSdu/erSNHjuidd96RJI0ZM0Yffvihpk6dqp07d2rgwIF66KGHtHr1akmXi5327durdevW2rJlix577DE999xzN+uwAQBucQxnAoDrYIzR8uXLtXTpUvXr10/Hjh1TYGCg3n//fc8wpo8++kgpKSl6//335XK5JEkzZsxQSEiIVq1apaZNm+rtt9/W0KFD1b59e0nS1KlTtXTp0qvu99dff9Unn3yiZcuWqUmTJpKkkiVLetanDn0KCwtTSEiIpMvJxejRo/Xf//5XNWvW9Dxm7dq1mjZtmurXr68pU6aoVKlSevPNNyVJ5cqV0/bt2/X6669n4lEDAPxTUEQAgAOLFi1S3rx5deHCBaWkpKhLly4aPny4+vTpo8qVK3vNg9i6dav27t2rfPnyeW3j3Llz2rdvn06dOqUjR46oRo0annV+fn6qXr16miFNqbZs2SJfX1/Vr18/w33eu3evzpw5o3vuucdr+fnz51W1alVJ0q5du7z6IclTcAAAcCWKCABwoGHDhpoyZYr8/f0VGRkpP7//fYwGBgZ6tT19+rSqVaumOXPmpNlOoUKFrmv/AQEBjh9z+vRpSdLixYtVpEgRr3Vut/u6+gEA+L+NIgIAHAgMDFTp0qUz1PaOO+7Qxx9/rLCwMAUFBaXbJiIiQt9//73q1asnSbp48aI2b96sO+64I932lStXVkpKilavXu0ZzmSVmoRcunTJs6xChQpyu906ePDgVROM8uXL68svv/RatmHDBvsnCQD4P4mJ1QBwk3Tt2lUFCxZU27Zt9d1332n//v1atWqV/vWvf+mPP/6QJPXv31+vvfaaFixYoF9++UVPPfXUNa/xUKJECXXr1k09evTQggULPNv85JNPJElRUVFyuVxatGiRjh07ptOnTytfvnwaPHiwBg4cqFmzZmnfvn368ccfNWHCBM2aNUuS1Lt3b+3Zs0dDhgzR7t27NXfuXM2cOfNmHyIAwC2KIgIAbpI8efJozZo1Kl68uNq3b6/y5curZ8+eOnfunCeZePrpp/Xwww+rW7duqlmzpvLly6f77rvvmtudMmWKOnbsqKeeekoxMTF6/PHHlZSUJEkqUqSIRowYoeeee06FCxdW3759JUmjRo3SSy+9pDFjxqh8+fJq3ry5Fi9erOjoaElS8eLF9fnnn2vBggWqUqWKpk6dqtGjR9/EowMAuJW5zNVm7wEAAABAOkgiAAAAADhCEQEAAADAEYoIAAAAAI5QRAAAAABwhCICAAAAgCMUEQAAAAAcoYgAAAAA4AhFBAAAAABHKCIAAAAAOEIRAQAAAMARiggAAAAAjvw/ZbGa63bFFaoAAAAASUVORK5CYII=",
      "text/plain": [
       "<Figure size 1000x700 with 2 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# Run the updated test with a small batch size\n",
    "test_data, csn_results = test_run(all_data, model, tokenizer, model_name, num_samples=1000, random_state=33, batch_size=5)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "4a137632-f76d-4cb9-b510-ea4a3c1ac282",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\nComparison of Predictions with Ground Truth and Rationales (Sample):\n\nCSN: 633KxSnLr68XR46fKnTRtb\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: Yes\nNumber of notes: 2\n\n  Note 207:\n  Predicted IHCA: Yes\n  Note Text (truncated): Otorhinolaryngology Inpatient Progress Note    Date of Surgery: **DATE**  Operation: Slash tracheostomy. Now s/p revision to 6-0pXLT  Post-Op Day: 3 Days Post-Op    **NAME** is a 76 y.o. year old male...\n  Model Rationale:\n  Positive  Your rationale:  The patient had a cardiac event in the ED and was resuscitated. The patient was admitted to the SICUs and is being followed by ENT.\n  --------------------------------------------------\n\n  Note 204:\n  Predicted IHCA: No\n  Note Text (truncated): Inpatient Discharge Summary    BRIEF OVERVIEW  Patient Name: **NAME** **NAME** **NAME**   **NAME** Provider: **NAME** MD   Primary Care Physician: **NAME** **NAME** **ID****CONTACT**       Admission D...\n  Model Rationale:\n  \n  --------------------------------------------------\n================================================================================\n\nCSN: EFz3uvu4jyh87G5wShbbAd\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: No\nNumber of notes: 1\n\n  Note 587:\n  Predicted IHCA: Yes\n  Note Text (truncated):         Length of **NAME**: 3 Days      **DATE**   12:12 PM     **NAME** **NAME** **NAME**:  **NAME** **NAME**:  **NAME**, DO as **NAME** - **NAME** (**NAME** **NAME**)     Extended **NAME** **NAME** ...\n  Model Rationale:\n  Positive  Rationale:  The patient had a cardiac event in the ED, which is an outpatient setting. The patient was intubate and received chest compression.\n  --------------------------------------------------\n================================================================================\n\nCSN: 97xhZD7jqTsNT4vGEV4afy\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: Yes\nNumber of notes: 3\n\n  Note 375:\n  Predicted IHCA: Yes\n  Note Text (truncated): Department of Medicine  Division of Cardiovascular Medicine     Hospital of the University of Pennsylvania Advanced Heart Failure/Cardiac Transplant        DISCHARGE SUMMARY  **DATE****NAME** 15, 2021...\n  Model Rationale:\n  Positive\n\n### Explanation\n\nThe patient had a cardiac event in the hospital, which was an in-patient cardiac arrest. The patient was admitted for further evaluation and management of his cardiac condition. The cardiac arrest was likely related to his underlying cardiac condition, which includes hypoplaistic left heart, supracaridac TAPV, and atrial fibrillation. The event was managed with chest compressons and the patient was transferred to the ICU for further care.\n  --------------------------------------------------\n\n  Note 377:\n  Predicted IHCA: No\n  Note Text (truncated): Division of Cardiovascular Medicine Inpatient Progress Note ACHD    Daily Progress Note  (LOS: 13 days)    Chief Complaint:complex congenital heart disease    Assessment and Plan:   33 yo M HLHS s/p s...\n  Model Rationale:\n  \n  --------------------------------------------------\n\n  Note 374:\n  Predicted IHCA: Yes\n  Note Text (truncated): Inpatient Discharge Summary    BRIEF OVERVIEW  Patient Name: **NAME**   Discharge Provider: **NAME**, MD   Primary Care Physician: **NAME** None       Admission Date: **DATE**      Patient Class: Inpa...\n  Model Rationale:\n  Positive  Rationale:  The discharge summary states that the \"patient expired in hospital.\"\n  --------------------------------------------------\n================================================================================\n\nCSN: G4CqDGUAVBwt44yAD9iqM2\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: Yes\nNumber of notes: 2\n\n  Note 643:\n  Predicted IHCA: Yes\n  Note Text (truncated): Assessment/Plan   # Acquired HOCM complicated by LVOT obstruction manifesting as presyncope  - Plan to admit to CICU once BP stabilized  -ETOH septal ablation planned for **DATE** with Dr. **NAME**  -...\n  Model Rationale:\n  Positive  Rationale:  The patient had a cardiac event in the hospital.  The notes mention that the \"patient was found unresponsive in her room\" and \"cardiac arrest was called\".  The EKG shows a sinus rhythm with a rate of 60.  There is also a mention that \"patient had a syncopal episode in the ER\".  This is consistent with a cardiac-related event.\n  --------------------------------------------------\n\n  Note 641:\n  Predicted IHCA: No\n  Note Text (truncated): Inpatient Discharge Summary    BRIEF OVERVIEW  Patient Name: **NAME**   Discharge Provider: **NAME**, MD   Primary Care Physician: **NAME** Nuschke **ID****CONTACT**       Admission Date: **DATE**    ...\n  Model Rationale:\n  \n  --------------------------------------------------\n================================================================================\n\nCSN: BugW8xz2yMK5FfgjYg3Fbt\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: Yes\nNumber of notes: 3\n\n  Note 491:\n  Predicted IHCA: No\n  Note Text (truncated): 38.9 mGy...\n  Model Rationale:\n  38.0 mG\n\n Your rationale: The patient was admitted to the hospital for a total of 3 days. The patient had a cardiac event on day 2 of admission. The cardiac event was a cardiac arrhythmia. The arrhythmias were treated with medications. The medications were administered in the hospital. The hospital is an in-patient setting. The event was not an out-patient event. The chest compressors were not administered. The compressors are not mentioned in the notes. The notes do not mention the compressors. The events were not treated with compressors.\n\nThe patient had no cardiac arrest in the in-patients setting.\n  --------------------------------------------------\n\n  Note 488:\n  Predicted IHCA: No\n  Note Text (truncated): Inpatient Oncology APP Service Discharge Navigator  (This document should be shared and updated throughout the inpatient admission)    On Admission: Item: Details: (Associated Instructions)      Route...\n  Model Rationale:\n  \n  --------------------------------------------------\n\n  Note 490:\n  Predicted IHCA: Yes\n  Note Text (truncated): Inpatient Discharge Summary    BRIEF OVERVIEW  Patient Name: **NAME**   Discharge Provider: **NAME** MD   Primary Care Physician: **NAME** **NAME**  **NAME** **ID****CONTACT** ***      Admission Date:...\n  Model Rationale:\n  Positive  Rationale:  The discharge summary mentions the patient having a cardiac event, but it is not clear if the event occurred in the hospital or not. The patient was admitted to the hospital and received chest compression, which indicates that the cardiac event occurred while the patient was in the inpatient hospital setting.\n  --------------------------------------------------\n================================================================================\n\nCSN: hK8H9NwqSovReG7np4twCg\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: No\nNumber of notes: 2\n\n  Note 2223:\n  Predicted IHCA: Yes\n  Note Text (truncated): Daily Progress **NAME**  (**NAME**: 9 days)    Assessment &amp; **NAME**     **NAME** is a 57 y.o. male, with hx of **NAME** withdrawal c/b seizures and hypertension who presents with seizure-like act...\n  Model Rationale:\n  Positive  Rationale: The patient had a cardiac event while in the hospital, which is an IHCA.\n  --------------------------------------------------\n\n  Note 2222:\n  Predicted IHCA: Yes\n  Note Text (truncated): Daily Progress **NAME**  (**NAME**: 10 days)    Assessment &amp; **NAME**     **NAME** is a 57 y.o. male, with hx of **NAME** withdrawal c/b seizures and hypertension who presents with seizure-like ac...\n  Model Rationale:\n  Positive  Your rationale:  The patient had a cardiac event while in the hospital.  The event occurred in the inpatient unit, and the patient was receiving care at the time.  Chest compressions were performed.  These are all criteria for an IHCA event.  Therefore, the patient did have an IH**\n  --------------------------------------------------\n================================================================================\n\nCSN: B6ZbgTpk7JXjsKbeeFAmeD\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: No\nNumber of notes: 1\n\n  Note 2356:\n  Predicted IHCA: Yes\n  Note Text (truncated): **NAME** **NAME** **NAME**-UP **NAME**    Assessment and Recommendations:  **NAME** is a 81 y.o. man with a past medical history of prostate cancer, diabetes mellitus, hypertension, CKD (stage 3), HFr...\n  Model Rationale:\n  **Positive**  **Rationale:**  The patient had a cardiac event that occurred in the hospital, and the patient was receiving chest compresses.\n  --------------------------------------------------\n================================================================================\n\nCSN: eSR5gcUUo8DCcd7vpd5hzr\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: No\nNumber of notes: 2\n\n  Note 1520:\n  Predicted IHCA: Yes\n  Note Text (truncated): PROGRESS **NAME**:  **NAME** CARDIOLOGY **NAME**    Hospital **NAME**: 4    ASSESSMENT:  **NAME** Problem:    Chronic heart failure (CMS-HCC)  Active Problems:    **NAME** 2 **NAME**    **NAME** s/p R...\n  Model Rationale:\n  **Positive**  Rationale:  The patient had a cardiac event while in the hospital.  She was found unresponsive in her room and was intubated.  A code was called and she was resuscitated.  Her cardiac rhythm was noted to be asystole.  This is consistent to the definition of an in hospital cardiac arrest.\n  --------------------------------------------------\n\n  Note 1518:\n  Predicted IHCA: Yes\n  Note Text (truncated): PROGRESS **NAME**:  **NAME** CARDIOLOGY **NAME**    Hospital **NAME**: 6    ASSESSMENT:  **NAME** Problem:    Chronic heart failure (CMS-HCC)  Active Problems:    **NAME** 2 **NAME**    **NAME** s/p R...\n  Model Rationale:\n  **Positive**  Rationale: The patient had a cardiac event that occurred in a hospital setting, and the patient was receiving care at the time of the event. The event was also described as a cardiac \"arrest\" and the ECG showed a rate and rhythm consistent with cardiac arrest.\n  --------------------------------------------------\n================================================================================\n\nCSN: MFRMsyx4JjF9ckeo72Z732\nPredicted IHCA (Majority Vote): No\nGround Truth IHCA: Yes\nNumber of notes: 1\n\n  Note 850:\n  Predicted IHCA: No\n  Note Text (truncated): Daily Progress Note  (LOS: 7 days)    Assessment &amp; Plan    71yo M with HTN, HL, CAD s/p PCI (2017) on ASA, Mild aortic stenosis, admitted **DATE** with neck pain and tinnitus, found to have distal...\n  Model Rationale:\n  \n  --------------------------------------------------\n================================================================================\n\nCSN: 2hznCqfdM4YPx5CMrfyk38\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: Yes\nNumber of notes: 1\n\n  Note 31:\n  Predicted IHCA: Yes\n  Note Text (truncated): Nephrology Attending Follow-up/procedure note Note    Seen and examined on CRRT    In summary:  Mr. **NAME** is a 66-year-old male with a history of HFrEF (LVEF 47%) **DATE** mixed ICM/NICM s/p **NAME...\n  Model Rationale:\n  positive\n\n### Explanation\n\nThe patient had a cardiac event that occurred in the hospital setting, which is an in-patient setting. The patient received CPR, which indicates that the cardiac event was a cardiac-arrest. Therefore, the patient experienced an in hospital cardiac arrest.\n\n### Answer\npositive\n  --------------------------------------------------\n================================================================================\n"
     ]
    }
   ],
   "source": [
    "import numpy as np\n",
    "from tqdm import tqdm\n",
    "\n",
    "def output_comparison_sample(test_data, csn_results, sample_size=10):\n",
    "    print(\"\\nComparison of Predictions with Ground Truth and Rationales (Sample):\")\n",
    "    sample_csns = np.random.choice(csn_results['csn'], min(sample_size, len(csn_results)), replace=False)\n",
    "    \n",
    "    for csn in sample_csns:\n",
    "        csn_data = test_data[test_data['csn'] == csn]\n",
    "        csn_result = csn_results[csn_results['csn'] == csn].iloc[0]\n",
    "        \n",
    "        print(f\"\\nCSN: {csn}\")\n",
    "        print(f\"Predicted IHCA (Majority Vote): {'Yes' if csn_result['predicted_ihca'] == 1 else 'No'}\")\n",
    "        print(f\"Ground Truth IHCA: {'Yes' if csn_result['cardiac_arrest'] == 1 else 'No'}\")\n",
    "        print(f\"Number of notes: {len(csn_data)}\")\n",
    "        \n",
    "        for idx, row in csn_data.iterrows():\n",
    "            print(f\"\\n  Note {idx + 1}:\")\n",
    "            print(f\"  Predicted IHCA: {'Yes' if row['predicted_ihca'] == 1 else 'No'}\")\n",
    "            print(f\"  Note Text (truncated): {row['note_text'][:200]}...\")  # Truncate note text for brevity\n",
    "            print(f\"  Model Rationale:\")\n",
    "            print(f\"  {row['rationale']}\")\n",
    "            print(\"  \" + \"-\" * 50)\n",
    "        \n",
    "        print(\"=\" * 80)\n",
    "\n",
    "def output_incorrect_predictions(test_data, csn_results, max_display=10):\n",
    "    print(\"\\nIncorrectly Predicted Cases:\")\n",
    "    incorrect_predictions = []\n",
    "    \n",
    "    for _, row in tqdm(csn_results.iterrows(), desc=\"Finding incorrect predictions\", total=len(csn_results)):\n",
    "        if row['predicted_ihca'] != row['cardiac_arrest']:\n",
    "            incorrect_predictions.append(row['csn'])\n",
    "    \n",
    "    for i, csn in enumerate(incorrect_predictions[:max_display], 1):\n",
    "        csn_data = test_data[test_data['csn'] == csn]\n",
    "        csn_result = csn_results[csn_results['csn'] == csn].iloc[0]\n",
    "        \n",
    "        print(f\"\\nIncorrect Prediction {i}:\")\n",
    "        print(f\"CSN: {csn}\")\n",
    "        print(f\"Predicted IHCA (Majority Vote): {'Yes' if csn_result['predicted_ihca'] == 1 else 'No'}\")\n",
    "        print(f\"Ground Truth IHCA: {'Yes' if csn_result['cardiac_arrest'] == 1 else 'No'}\")\n",
    "        print(f\"Number of notes: {len(csn_data)}\")\n",
    "        \n",
    "        for idx, row in csn_data.iterrows():\n",
    "            print(f\"\\n  Note {idx + 1}:\")\n",
    "            print(f\"  Predicted IHCA: {'Yes' if row['predicted_ihca'] == 1 else 'No'}\")\n",
    "            print(f\"  Note Text (truncated): {row['note_text'][:200]}...\")  # Truncate note text for brevity\n",
    "            print(f\"  Model Rationale:\")\n",
    "            print(f\"  {row['rationale']}\")\n",
    "            print(\"  \" + \"-\" * 50)\n",
    "        \n",
    "        print(\"=\" * 80)\n",
    "    \n",
    "    print(f\"\\nTotal incorrect predictions: {len(incorrect_predictions)}\")\n",
    "\n",
    "# After running the test_run function\n",
    "output_comparison_sample(test_data, csn_results)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "15433e89-226a-46a2-ab83-05b9cc65810b",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\nIncorrectly Predicted Cases:\n"
     ]
    },
    {
     "output_type": "stream",
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\rFinding incorrect predictions:   0%|          | 0/574 [00:00<?, ?it/s]\rFinding incorrect predictions: 100%|██████████| 574/574 [00:00<00:00, 27849.79it/s]"
     ]
    },
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\nIncorrect Prediction 1:\nCSN: 2fdh3HwHfDCXbcAcrnw9aZ\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: No\nNumber of notes: 1\n\n  Note 24:\n  Predicted IHCA: Yes\n  Note Text (truncated): **NAME** **NAME** Summary    **NAME** OVERVIEW  **NAME** **NAME**: **NAME** **NAME**   **NAME** **NAME**: **NAME**, MD   Primary **NAME** **NAME**: **NAME** **NAME** **ID****CONTACT**       **NAME** *...\n  Model Rationale:\n  **Positive**  Your rationale:  The notes summary indicates that the cardiac event occurred in the hospital and the patient was receiving care. The patient's condition deteriorated and the family decided to move toward comfort measures, which indicates that chest compresses were performed.\n  --------------------------------------------------\n================================================================================\n\nIncorrect Prediction 2:\nCSN: 2nSFjjsYK9Uqmb7VHiTBgo\nPredicted IHCA (Majority Vote): No\nGround Truth IHCA: Yes\nNumber of notes: 2\n\n  Note 35:\n  Predicted IHCA: No\n  Note Text (truncated): Renal CRRT Attending Note    This patient is being followed by the Blue Nephrology Service. Please call the Renal Fellow on service with questions.       Events noted.   72 yr old male with hypertensi...\n  Model Rationale:\n  Your rationale: 1. The patient had a cardiac event. 2. The event occurred in the hospital. 3. The cardiac event was treated with chest compresses.\n  --------------------------------------------------\n\n  Note 34:\n  Predicted IHCA: No\n  Note Text (truncated): Top tracheostomy sutures removed **DATE**   **NAME** tracheostomy sutures removed **DATE**...\n  Model Rationale:\n  Your rationale:\n  --------------------------------------------------\n================================================================================\n\nIncorrect Prediction 3:\nCSN: 2yy3uBVrYWzhS5GWXHvqZy\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: No\nNumber of notes: 4\n\n  Note 40:\n  Predicted IHCA: Yes\n  Note Text (truncated): **NAME** **NAME** Summary    **NAME** OVERVIEW  **NAME** **NAME**: **NAME**   **NAME** **NAME**: **NAME**, MD   Primary **NAME** **NAME**: **NAME** **NAME**  **NAME** **NAME**: **DATE**      **NAME** ...\n  Model Rationale:\n  **Positive**  Rationale:  The notes mention that the \"patient was noted on admission to have ascites\" and that \"he underwent diagnostic peritoneocentesis in emergency department\" and \"he was started IV metop**NAME**, cef**NAME****NAME****DATE**. The notes also mention that \"CT abdomen pel**NAME***NAME**\" and \"**NAME** demonstrated bib**NAME*****NAME**.\" The notes further mention that \"**NAME***DATE**\" which is a cardiac rhythm strip. The patient received \"chest compressions\" and was \"resuscitated\" and the notes mention \"cardiac arrest\" and **NAME***.  The **NAME*****DATE** which is an ECG.\n  --------------------------------------------------\n\n  Note 41:\n  Predicted IHCA: Yes\n  Note Text (truncated):   Hospital of the **NAME** of **NAME**  Department of Internal Medicine  **NAME** **NAME** **NAME** **NAME**     ASSESSMENT **NAME** **NAME**     54M PMHx presumed metastatic pancreatic cancer c/b asc...\n  Model Rationale:\n  Positive  Your rationale:  The patient had a cardiac event while in the hospital, which is an in-patient setting. The patient received CPR, which indicates that the cardiac event was a cardiac arrhythmia.\n  --------------------------------------------------\n\n  Note 43:\n  Predicted IHCA: Yes\n  Note Text (truncated):   Hospital of the **NAME** of **NAME**  Department of Internal Medicine  **NAME** **NAME** **NAME** **NAME**     ASSESSMENT **NAME** **NAME**     54M PMHx presumed metastatic pancreatic cancer c/b asc...\n  Model Rationale:\n  positive  Your rationale:  The patient had a cardiac event while in the hospital. The patient was noted to have a pulseless electrical activity (PEA) arrest. The arrest occurred while the patient was in the inpatient unit. The cardiac event was noted in the patient chart. The event was confirmed by the patient’s EKG. The EKG showed a PEA arrest.\n  --------------------------------------------------\n\n  Note 42:\n  Predicted IHCA: No\n  Note Text (truncated): 4.5L removed  80mGy  ...\n  Model Rationale:\n  Your rationale:\n  --------------------------------------------------\n================================================================================\n\nIncorrect Prediction 4:\nCSN: 35FqqNKSq3CXsi8rwkwM7J\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: No\nNumber of notes: 3\n\n  Note 2278:\n  Predicted IHCA: Yes\n  Note Text (truncated): **NAME** Progress **NAME**    Subjective: seen in followup for **NAME**, CKD. **NAME** better. No difficulty voiding.     Review of Systems   Respiratory:  Negative for shortness of breath.    **NAME*...\n  Model Rationale:\n  **Positive**  Rationale: The patient had a cardiac event while in the hospital. The patient was given chest compresses.\n  --------------------------------------------------\n\n  Note 2279:\n  Predicted IHCA: No\n  Note Text (truncated): **NAME**    **NAME** is a 73 y.o. female     SUBJECTIVE  Pt seen. Resting comfortably  No events overnight   Tolerating PO  Cr 2.39  BGs stable   last trulicity dose was **DATE**      states taking tr...\n  Model Rationale:\n  \n  --------------------------------------------------\n\n  Note 2277:\n  Predicted IHCA: Yes\n  Note Text (truncated): **NAME**    **NAME** is a 73 y.o. female     SUBJECTIVE  Pt seen. Resting comfortably  No events overnight   Tolerating PO  BGs stable   last trulicity dose was **DATE**      states taking trulicity 1...\n  Model Rationale:\n  **Positive**   Your rationale:  **The patient had a cardiac event in the hospital and received chest compression.**\n  --------------------------------------------------\n================================================================================\n\nIncorrect Prediction 5:\nCSN: 37ygR73YZhea45tMAuWBGx\nPredicted IHCA (Majority Vote): No\nGround Truth IHCA: Yes\nNumber of notes: 1\n\n  Note 47:\n  Predicted IHCA: No\n  Note Text (truncated): No acute changes overnight - straight cathed for sterile urine, 100cc amber urine noted; tolerating IVABX without issue; received 75g albumin overnight; NSR noted on telemetry; slept well overnight; R...\n  Model Rationale:\n  \n  --------------------------------------------------\n================================================================================\n\nIncorrect Prediction 6:\nCSN: 3AVjMU9zuUSVnFzoKo5RTi\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: No\nNumber of notes: 1\n\n  Note 49:\n  Predicted IHCA: Yes\n  Note Text (truncated): **NAME** **NAME** Summary    **NAME** OVERVIEW  **NAME** **NAME**: **NAME**   **NAME** **NAME**: **NAME**, DO   Primary **NAME** **NAME**: **NAME** **ID****CONTACT**       **NAME** **NAME**: **DATE** ...\n  Model Rationale:\n  **Positive**  Your response:  Your rationale: 1) The patient had a cardiac event that required chest compresses. 2) The event occurred in the hospital. 3) The cardiac event was not in an outpatient setting. 4) The hospital was the setting of the cardiac event. 5) The setting was not an outpatient clinic or emergency department. 6) The location of the event was the hospital, not the ED or outpatient clinic. 7) The notes state that the event occurred while the patient was in the ICU. 8) The ICU is an in-patient setting.\n  --------------------------------------------------\n================================================================================\n\nIncorrect Prediction 7:\nCSN: 3K4RhhoR6o4Dyrc4u2iuyV\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: No\nNumber of notes: 2\n\n  Note 52:\n  Predicted IHCA: Yes\n  Note Text (truncated): **NAME** **NAME** Summary    **NAME** OVERVIEW  **NAME** **NAME**: **NAME** **NAME** **NAME**   **NAME** **NAME**: **NAME**, MD   Primary **NAME** **NAME**: **NAME** **ID****CONTACT**       **NAME** *...\n  Model Rationale:\n  **Positive**  Your rationale:  The summary states that the \"RRT was [called] for L-sided chest pain\" and that the pt was \"s/p stents\" and \"s/o RCC s/o nephrectomies\". These are all indications of a cardiac event. The pt was also \"s/t unstable anginas\" and was \"pain free\" at the time of the discharge. The patient also received chest compression.\n  --------------------------------------------------\n\n  Note 54:\n  Predicted IHCA: No\n  Note Text (truncated): Pt denies chest pain or discomfort at this time. Pt expressed \"slight\" **DATE** headache, received **NAME** tylenol with relief. VSS, currently resting in bed with no signs of distress. **NAME** conti...\n  Model Rationale:\n  Your rationale: 1) The patient was admitted to the hospital and was receiving care. This indicates that the cardiac event occurred in the inpatient hospital setting. 2) The cardiac arrest is mentioned in the notes. 3) The notes mention that the \"patient received chest compression.\" This indicates the patient was receiving chest compresses, which is a sign of cardiac event.\n  --------------------------------------------------\n================================================================================\n\nIncorrect Prediction 8:\nCSN: 3UZNNGf77joCSJVm7MxfoL\nPredicted IHCA (Majority Vote): No\nGround Truth IHCA: Yes\nNumber of notes: 1\n\n  Note 68:\n  Predicted IHCA: No\n  Note Text (truncated): Hospital of the University of Pennsylvania  Inpatient Discharge Summary   Patient Name: **NAME**   Discharge Provider: **NAME** **NAME***   Primary Care Physician: **NAME** **NAME** **ID****CONTACT** ...\n  Model Rationale:\n  **NAME****CONTACT****CONTACT***   Admission Discharge Date:  **DATE**\n**DATE**   **DATE**\n\n**DATE**\n\n## **date**\n\n\n## **name**\n\n\n**NAME**\n\n##  **name**\n\n## *name*\n\n## *contact*\n\n## **contact**\n\n## Name\n\n## Name\n\n\n## Name\n**NAME**\n**NAME***\n\n\n## *id*\n\n## Name\n\n\n\n## *location*\n\n##  *location*\n\n\n##  name\n\n## *date*\n\n## Date\n\n## Date\n\n\n## Date\n\n\n\n## Date\n**DATE**\n  --------------------------------------------------\n================================================================================\n\nIncorrect Prediction 9:\nCSN: 3adGNHK339xUHK4YE6tedU\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: No\nNumber of notes: 3\n\n  Note 83:\n  Predicted IHCA: Yes\n  Note Text (truncated): Daily Progress **NAME**  (**NAME**: 16 days)    Assessment &amp; **NAME**       67 y.o. female w/ PMH of **NAME**, multivessel **NAME**, HTN, T2DM, HLD, initially admitted for CABG workup after diagno...\n  Model Rationale:\n  positive  Rationale:  The patient had a cardiac event while in the hospital, which is an IHCA.\n  --------------------------------------------------\n\n  Note 81:\n  Predicted IHCA: Yes\n  Note Text (truncated): Daily Progress **NAME**  (**NAME**: 18 days)    Assessment &amp; **NAME**       67 y.o. female w/ PMH of **NAME**, multivessel **NAME**, HTN, T2DM, HLD, initially admitted for CABG workup after diagno...\n  Model Rationale:\n  Positive  Rationale:  The patient had a cardiac event in the hospital, which is an IHCA.\n  --------------------------------------------------\n\n  Note 80:\n  Predicted IHCA: Yes\n  Note Text (truncated): **NAME** **NAME** Summary    **NAME** OVERVIEW  **NAME** **NAME**: **NAME** **NAME**   **NAME** **NAME**: **NAME**, MD   Primary **NAME** **NAME**: **NAME** **NAME**       **NAME** **NAME**: **DATE** ...\n  Model Rationale:\n  **Positive**  Rationale: The patient had a cardiac event (NSTEM) and a stroke, both of which are cardiac arrests.\n  --------------------------------------------------\n================================================================================\n\nIncorrect Prediction 10:\nCSN: 3pNxTjZnTgLVGKwFgWHVPM\nPredicted IHCA (Majority Vote): Yes\nGround Truth IHCA: No\nNumber of notes: 1\n\n  Note 97:\n  Predicted IHCA: Yes\n  Note Text (truncated): **NAME** **NAME** Summary    **NAME** OVERVIEW  **NAME** **NAME**: **NAME** **NAME**   **NAME** **NAME**: **NAME**, MD   Primary **NAME** **NAME**: **NAME** **NAME** **ID****CONTACT**     **NAME** **N...\n  Model Rationale:\n  **Positive**  Your rationale:  The notes mention that the **NAME*** was admitted to the hospital and received **NAME*****. The **NAME* was also given **NAME******. The patient's **NAME******* was also mentioned. The notes also mention that **NAME********** was performed. The above information indicates that the event occurred in a hospital setting.\n  --------------------------------------------------\n================================================================================\n\nTotal incorrect predictions: 261\n"
     ]
    },
    {
     "output_type": "stream",
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    }
   ],
   "source": [
    "output_incorrect_predictions(test_data, csn_results)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "81345b7f-9a3b-4db5-b42a-4af7bf640765",
     "showTitle": false,
     "title": ""
    }
   },
   "source": [
    "## Plots with bootstrapped confidence intervals and with medical models"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "a1f4c930-97fb-4430-8cf8-47bb89726d8a",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Balanced_accuracy plot saved to: /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/plots/balanced_accuracy_comparison.png\nBalanced_accuracy plot saved to: /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/plots/balanced_accuracy_comparison.pdf\nPrecision plot saved to: /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/plots/precision_comparison.png\nPrecision plot saved to: /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/plots/precision_comparison.pdf\nRecall plot saved to: /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/plots/recall_comparison.png\nRecall plot saved to: /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/plots/recall_comparison.pdf\nF1_score plot saved to: /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/plots/f1_score_comparison.png\nF1_score plot saved to: /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/plots/f1_score_comparison.pdf\n"
     ]
    },
    {
     "output_type": "display_data",
     "data": {
      "text/html": [
       "<style scoped>\n",
       "  .table-result-container {\n",
       "    max-height: 300px;\n",
       "    overflow: auto;\n",
       "  }\n",
       "  table, th, td {\n",
       "    border: 1px solid black;\n",
       "    border-collapse: collapse;\n",
       "  }\n",
       "  th, td {\n",
       "    padding: 5px;\n",
       "  }\n",
       "  th {\n",
       "    text-align: left;\n",
       "  }\n",
       "</style><div class='table-result-container'><table class='table-result'><thead style='background-color: white'><tr><th>model_name</th><th>mean</th><th>ci_lower</th><th>ci_upper</th><th>is_medical</th></tr></thead><tbody><tr><td>GPT-4o</td><td>0.8961038961038961</td><td>0.8701298701298702</td><td>0.9090909090909091</td><td>false</td></tr><tr><td>mistralai/Mistral-Nemo-Instruct-2407</td><td>0.8382642763589583</td><td>0.7875667828106853</td><td>0.8898702584225969</td><td>false</td></tr><tr><td>princeton-nlp/gemma-2-9b-it-SimPO</td><td>0.8230852211434736</td><td>0.7572815533980582</td><td>0.888888888888889</td><td>false</td></tr><tr><td>THUDM/glm-4-9b-chat</td><td>0.7938574760026689</td><td>0.7915518824609733</td><td>0.7961630695443644</td><td>false</td></tr><tr><td>meta-llama/Meta-Llama-3.1-8B-Instruct</td><td>0.7856044862715067</td><td>0.7246923344502639</td><td>0.8394230644210309</td><td>false</td></tr><tr><td>ruslanmv/Medical-Llama3-8B</td><td>0.7810710403667358</td><td>0.770725889971023</td><td>0.7968690611934626</td><td>true</td></tr><tr><td>CohereForAI/aya-23-8B</td><td>0.7657570186937249</td><td>0.7595212187159956</td><td>0.7719928186714542</td><td>false</td></tr><tr><td>mistralai/Mistral-7B-Instruct-v0.3</td><td>0.7611520829180786</td><td>0.6413793103448276</td><td>0.8809248554913295</td><td>false</td></tr><tr><td>aaditya/Llama3-OpenBioLLM-8B</td><td>0.755753873082393</td><td>0.7272727272727272</td><td>0.7707581227436823</td><td>true</td></tr><tr><td>instruction-pretrain/medicine-Llama3-8B</td><td>0.7468557851654358</td><td>0.6991643454038997</td><td>0.7945472249269718</td><td>true</td></tr><tr><td>meta-llama/Meta-Llama-3-8B-Instruct</td><td>0.7459950859950861</td><td>0.7174447174447175</td><td>0.7745454545454546</td><td>false</td></tr><tr><td>Nexusflow/Starling-LM-7B-beta</td><td>0.726020811563569</td><td>0.6348122866894198</td><td>0.8172293364377182</td><td>false</td></tr><tr><td>johnsnowlabs/JSL-MedLlama-3-8B-v17</td><td>0.7219904367099335</td><td>0.631578947368421</td><td>0.8513053348467651</td><td>true</td></tr><tr><td>CohereForAI/c4ai-command-r-plus-4bit</td><td>0.7210567210567209</td><td>0.6666666666666666</td><td>0.7692307692307692</td><td>false</td></tr><tr><td>FuseAI/FuseChat-7B-v2.0</td><td>0.714063714063714</td><td>0.7008547008547009</td><td>0.7272727272727272</td><td>false</td></tr><tr><td>YBXL/Med-LLaMA3-8B-ft0.5</td><td>0.7127594732907824</td><td>0.6386554621848739</td><td>0.7723502304147466</td><td>true</td></tr><tr><td>databricks/dolly-v2-12b</td><td>0.7104476678807358</td><td>0.664968152866242</td><td>0.7520891364902508</td><td>false</td></tr><tr><td>MohamedAhmedAE/Llama3-8B-Medical-Finetune-V3-Merged</td><td>0.7051445721068781</td><td>0.6666666666666666</td><td>0.7658402203856749</td><td>true</td></tr><tr><td>bongbongs/NewMes-v15</td><td>0.7033845117120179</td><td>0.670360110803324</td><td>0.7592954990215265</td><td>true</td></tr><tr><td>unsloth/Meta-Llama-3.1-8B-Instruct</td><td>0.6984240889264107</td><td>0.6213592233009708</td><td>0.8000000000000002</td><td>false</td></tr><tr><td>tiiuae/falcon-11B</td><td>0.6939295210275999</td><td>0.6666666666666665</td><td>0.7170542635658915</td><td>false</td></tr><tr><td>CohereForAI/c4ai-command-r-v01-4bit</td><td>0.691747572815534</td><td>0.691747572815534</td><td>0.691747572815534</td><td>false</td></tr><tr><td>princeton-nlp/gemma-2-9b-it-DPO</td><td>0.68928199016833</td><td>0.683673469387755</td><td>0.6948905109489052</td><td>false</td></tr><tr><td>Qwen/Qwen2-7B-Instruct</td><td>0.6867977029631164</td><td>0.6152735469943532</td><td>0.76970868858098</td><td>false</td></tr><tr><td>LGAI-EXAONE/EXAONE-3.0-7.8B-Instruct</td><td>0.6610675022807896</td><td>0.609191206801147</td><td>0.7340404380681195</td><td>false</td></tr><tr><td>nvidia/Minitron-8B-Base</td><td>0.6592548076923077</td><td>0.6153846153846153</td><td>0.703125</td><td>false</td></tr><tr><td>OpenMeditron/Meditron3-8B</td><td>0.6591668411971795</td><td>0.6153846153846153</td><td>0.6954492415402567</td><td>true</td></tr><tr><td>anthracite-org/magnum-12b-v2</td><td>0.6554921642119051</td><td>0.5669818754925139</td><td>0.7658580484641548</td><td>false</td></tr><tr><td>google/gemma-2-9b-it</td><td>0.6476472625139472</td><td>0.6329113924050633</td><td>0.6595744680851063</td><td>false</td></tr><tr><td>unsloth/Meta-Llama-3.1-70B-Instruct-bnb-4bit</td><td>0.6433259992665934</td><td>0.5577557755775578</td><td>0.7499999999999999</td><td>false</td></tr><tr><td>Intel/neural-chat-7b-v3-3</td><td>0.6379977734165334</td><td>0.5142146410803127</td><td>0.7617809057527539</td><td>false</td></tr><tr><td>NousResearch/Hermes-3-Llama-3.1-8B</td><td>0.6135729386892178</td><td>0.5</td><td>0.8290909090909091</td><td>false</td></tr><tr><td>ChenWeiLi/Med-ChimeraLlama-3-8B_SHERP</td><td>0.6132605383034936</td><td>0.5274725274725275</td><td>0.7384259259259259</td><td>true</td></tr><tr><td>allenai/OLMo-7B-0724-hf</td><td>0.5988738916515379</td><td>0.5138211382113821</td><td>0.6839266450916937</td><td>false</td></tr><tr><td>AdaptLLM/medicine-chat</td><td>0.598217468805704</td><td>0.5294117647058824</td><td>0.6652406417112299</td><td>true</td></tr><tr><td>01-ai/Yi-1.5-9B-Chat</td><td>0.5729861393029055</td><td>0.39534883720930236</td><td>0.7506234413965087</td><td>false</td></tr><tr><td>m42-health/Llama3-Med42-8B</td><td>0.5654670750382849</td><td>0.5</td><td>0.6309341500765697</td><td>true</td></tr><tr><td>akjindal53244/Llama-3.1-Storm-8B</td><td>0.5599131809081451</td><td>0.425</td><td>0.7221510883482715</td><td>false</td></tr><tr><td>ProbeMedicalYonseiMAILab/medllama3-v20</td><td>0.5472080354102825</td><td>0.42471910112359545</td><td>0.6696969696969697</td><td>true</td></tr><tr><td>FreedomIntelligence/Apollo-7B</td><td>0.5087149897824257</td><td>0.44680851063829785</td><td>0.5706214689265536</td><td>false</td></tr><tr><td>ContactDoctor/Bio-Medical-Llama-3-8B</td><td>0.508642663374604</td><td>0.4365079365079365</td><td>0.6209633278598796</td><td>true</td></tr><tr><td>tiiuae/falcon-mamba-7b-instruct</td><td>0.5033071517155849</td><td>0.3658536585365854</td><td>0.6440677966101694</td><td>false</td></tr><tr><td>lighteternal/Llama3-merge-biomed-8b</td><td>0.49314469749252354</td><td>0.2857142857142857</td><td>0.7270531400966181</td><td>true</td></tr><tr><td>jiviai/meditron-7b-guanaco-chat</td><td>0.491919191919192</td><td>0.3838383838383838</td><td>0.6000000000000001</td><td>true</td></tr><tr><td>dnhkng/RYS-Llama-3.1-8B-Instruct</td><td>0.4709281365503253</td><td>0.3858267716535433</td><td>0.6367137355584082</td><td>false</td></tr><tr><td>ClosedCharacter/Peach-9B-8k-Roleplay</td><td>0.43664587046939984</td><td>0.38636363636363635</td><td>0.48692810457516333</td><td>false</td></tr><tr><td>microsoft/Phi-3.5-mini-instruct</td><td>0.42258580159849557</td><td>0.33333333333333337</td><td>0.59109073812882</td><td>false</td></tr><tr><td>google/gemma-2-2b-it</td><td>0.39094813466304795</td><td>0.3246753246753247</td><td>0.5037707390648567</td><td>false</td></tr><tr><td>PharMolix/BioMedGPT-LM-7B</td><td>0.38774033166556526</td><td>0.3551401869158879</td><td>0.4444444444444444</td><td>true</td></tr><tr><td>ghost-x/ghost-8b-beta-1608</td><td>0.3696098954415115</td><td>0.25</td><td>0.5297157622739017</td><td>false</td></tr><tr><td>HuggingFaceTB/SmolLM-1.7B</td><td>0.3015873015873016</td><td>0.28571428571428575</td><td>0.3333333333333333</td><td>false</td></tr><tr><td>microsoft/Phi-3-mini-128k-instruct</td><td>0.25194075552148465</td><td>0.08641975308641975</td><td>0.3740113811728395</td><td>false</td></tr><tr><td>microsoft/Orca-2-13b</td><td>0.2145409472975275</td><td>0.1492537313432836</td><td>0.2838427947598253</td><td>false</td></tr><tr><td>Optron/Llama-3.1-8B-bnb-4bit-medical</td><td>0.20647543311559216</td><td>0.12723658051689862</td><td>0.2857142857142857</td><td>true</td></tr><tr><td>medalpaca/medalpaca-7b</td><td>0.1549516669954626</td><td>0.0</td><td>0.3635036496350364</td><td>true</td></tr><tr><td>epfl-llm/meditron-7b</td><td>0.11998754669987548</td><td>0.0</td><td>0.19178082191780824</td><td>true</td></tr></tbody></table></div>"
      ]
     },
     "metadata": {
      "application/vnd.databricks.v1+output": {
       "addedWidgets": {},
       "aggData": [],
       "aggError": "",
       "aggOverflow": false,
       "aggSchema": [],
       "aggSeriesLimitReached": false,
       "aggType": "",
       "arguments": {},
       "columnCustomDisplayInfos": {},
       "data": [
        [
         "GPT-4o",
         0.8961038961038961,
         0.8701298701298702,
         0.9090909090909091,
         false
        ],
        [
         "mistralai/Mistral-Nemo-Instruct-2407",
         0.8382642763589583,
         0.7875667828106853,
         0.8898702584225969,
         false
        ],
        [
         "princeton-nlp/gemma-2-9b-it-SimPO",
         0.8230852211434736,
         0.7572815533980582,
         0.888888888888889,
         false
        ],
        [
         "THUDM/glm-4-9b-chat",
         0.7938574760026689,
         0.7915518824609733,
         0.7961630695443644,
         false
        ],
        [
         "meta-llama/Meta-Llama-3.1-8B-Instruct",
         0.7856044862715067,
         0.7246923344502639,
         0.8394230644210309,
         false
        ],
        [
         "ruslanmv/Medical-Llama3-8B",
         0.7810710403667358,
         0.770725889971023,
         0.7968690611934626,
         true
        ],
        [
         "CohereForAI/aya-23-8B",
         0.7657570186937249,
         0.7595212187159956,
         0.7719928186714542,
         false
        ],
        [
         "mistralai/Mistral-7B-Instruct-v0.3",
         0.7611520829180786,
         0.6413793103448276,
         0.8809248554913295,
         false
        ],
        [
         "aaditya/Llama3-OpenBioLLM-8B",
         0.755753873082393,
         0.7272727272727272,
         0.7707581227436823,
         true
        ],
        [
         "instruction-pretrain/medicine-Llama3-8B",
         0.7468557851654358,
         0.6991643454038997,
         0.7945472249269718,
         true
        ],
        [
         "meta-llama/Meta-Llama-3-8B-Instruct",
         0.7459950859950861,
         0.7174447174447175,
         0.7745454545454546,
         false
        ],
        [
         "Nexusflow/Starling-LM-7B-beta",
         0.726020811563569,
         0.6348122866894198,
         0.8172293364377182,
         false
        ],
        [
         "johnsnowlabs/JSL-MedLlama-3-8B-v17",
         0.7219904367099335,
         0.631578947368421,
         0.8513053348467651,
         true
        ],
        [
         "CohereForAI/c4ai-command-r-plus-4bit",
         0.7210567210567209,
         0.6666666666666666,
         0.7692307692307692,
         false
        ],
        [
         "FuseAI/FuseChat-7B-v2.0",
         0.714063714063714,
         0.7008547008547009,
         0.7272727272727272,
         false
        ],
        [
         "YBXL/Med-LLaMA3-8B-ft0.5",
         0.7127594732907824,
         0.6386554621848739,
         0.7723502304147466,
         true
        ],
        [
         "databricks/dolly-v2-12b",
         0.7104476678807358,
         0.664968152866242,
         0.7520891364902508,
         false
        ],
        [
         "MohamedAhmedAE/Llama3-8B-Medical-Finetune-V3-Merged",
         0.7051445721068781,
         0.6666666666666666,
         0.7658402203856749,
         true
        ],
        [
         "bongbongs/NewMes-v15",
         0.7033845117120179,
         0.670360110803324,
         0.7592954990215265,
         true
        ],
        [
         "unsloth/Meta-Llama-3.1-8B-Instruct",
         0.6984240889264107,
         0.6213592233009708,
         0.8000000000000002,
         false
        ],
        [
         "tiiuae/falcon-11B",
         0.6939295210275999,
         0.6666666666666665,
         0.7170542635658915,
         false
        ],
        [
         "CohereForAI/c4ai-command-r-v01-4bit",
         0.691747572815534,
         0.691747572815534,
         0.691747572815534,
         false
        ],
        [
         "princeton-nlp/gemma-2-9b-it-DPO",
         0.68928199016833,
         0.683673469387755,
         0.6948905109489052,
         false
        ],
        [
         "Qwen/Qwen2-7B-Instruct",
         0.6867977029631164,
         0.6152735469943532,
         0.76970868858098,
         false
        ],
        [
         "LGAI-EXAONE/EXAONE-3.0-7.8B-Instruct",
         0.6610675022807896,
         0.609191206801147,
         0.7340404380681195,
         false
        ],
        [
         "nvidia/Minitron-8B-Base",
         0.6592548076923077,
         0.6153846153846153,
         0.703125,
         false
        ],
        [
         "OpenMeditron/Meditron3-8B",
         0.6591668411971795,
         0.6153846153846153,
         0.6954492415402567,
         true
        ],
        [
         "anthracite-org/magnum-12b-v2",
         0.6554921642119051,
         0.5669818754925139,
         0.7658580484641548,
         false
        ],
        [
         "google/gemma-2-9b-it",
         0.6476472625139472,
         0.6329113924050633,
         0.6595744680851063,
         false
        ],
        [
         "unsloth/Meta-Llama-3.1-70B-Instruct-bnb-4bit",
         0.6433259992665934,
         0.5577557755775578,
         0.7499999999999999,
         false
        ],
        [
         "Intel/neural-chat-7b-v3-3",
         0.6379977734165334,
         0.5142146410803127,
         0.7617809057527539,
         false
        ],
        [
         "NousResearch/Hermes-3-Llama-3.1-8B",
         0.6135729386892178,
         0.5,
         0.8290909090909091,
         false
        ],
        [
         "ChenWeiLi/Med-ChimeraLlama-3-8B_SHERP",
         0.6132605383034936,
         0.5274725274725275,
         0.7384259259259259,
         true
        ],
        [
         "allenai/OLMo-7B-0724-hf",
         0.5988738916515379,
         0.5138211382113821,
         0.6839266450916937,
         false
        ],
        [
         "AdaptLLM/medicine-chat",
         0.598217468805704,
         0.5294117647058824,
         0.6652406417112299,
         true
        ],
        [
         "01-ai/Yi-1.5-9B-Chat",
         0.5729861393029055,
         0.39534883720930236,
         0.7506234413965087,
         false
        ],
        [
         "m42-health/Llama3-Med42-8B",
         0.5654670750382849,
         0.5,
         0.6309341500765697,
         true
        ],
        [
         "akjindal53244/Llama-3.1-Storm-8B",
         0.5599131809081451,
         0.425,
         0.7221510883482715,
         false
        ],
        [
         "ProbeMedicalYonseiMAILab/medllama3-v20",
         0.5472080354102825,
         0.42471910112359545,
         0.6696969696969697,
         true
        ],
        [
         "FreedomIntelligence/Apollo-7B",
         0.5087149897824257,
         0.44680851063829785,
         0.5706214689265536,
         false
        ],
        [
         "ContactDoctor/Bio-Medical-Llama-3-8B",
         0.508642663374604,
         0.4365079365079365,
         0.6209633278598796,
         true
        ],
        [
         "tiiuae/falcon-mamba-7b-instruct",
         0.5033071517155849,
         0.3658536585365854,
         0.6440677966101694,
         false
        ],
        [
         "lighteternal/Llama3-merge-biomed-8b",
         0.49314469749252354,
         0.2857142857142857,
         0.7270531400966181,
         true
        ],
        [
         "jiviai/meditron-7b-guanaco-chat",
         0.491919191919192,
         0.3838383838383838,
         0.6000000000000001,
         true
        ],
        [
         "dnhkng/RYS-Llama-3.1-8B-Instruct",
         0.4709281365503253,
         0.3858267716535433,
         0.6367137355584082,
         false
        ],
        [
         "ClosedCharacter/Peach-9B-8k-Roleplay",
         0.43664587046939984,
         0.38636363636363635,
         0.48692810457516333,
         false
        ],
        [
         "microsoft/Phi-3.5-mini-instruct",
         0.42258580159849557,
         0.33333333333333337,
         0.59109073812882,
         false
        ],
        [
         "google/gemma-2-2b-it",
         0.39094813466304795,
         0.3246753246753247,
         0.5037707390648567,
         false
        ],
        [
         "PharMolix/BioMedGPT-LM-7B",
         0.38774033166556526,
         0.3551401869158879,
         0.4444444444444444,
         true
        ],
        [
         "ghost-x/ghost-8b-beta-1608",
         0.3696098954415115,
         0.25,
         0.5297157622739017,
         false
        ],
        [
         "HuggingFaceTB/SmolLM-1.7B",
         0.3015873015873016,
         0.28571428571428575,
         0.3333333333333333,
         false
        ],
        [
         "microsoft/Phi-3-mini-128k-instruct",
         0.25194075552148465,
         0.08641975308641975,
         0.3740113811728395,
         false
        ],
        [
         "microsoft/Orca-2-13b",
         0.2145409472975275,
         0.1492537313432836,
         0.2838427947598253,
         false
        ],
        [
         "Optron/Llama-3.1-8B-bnb-4bit-medical",
         0.20647543311559216,
         0.12723658051689862,
         0.2857142857142857,
         true
        ],
        [
         "medalpaca/medalpaca-7b",
         0.1549516669954626,
         0.0,
         0.3635036496350364,
         true
        ],
        [
         "epfl-llm/meditron-7b",
         0.11998754669987548,
         0.0,
         0.19178082191780824,
         true
        ]
       ],
       "datasetInfos": [],
       "dbfsResultPath": null,
       "isJsonSchema": true,
       "metadata": {},
       "overflow": false,
       "plotOptions": {
        "customPlotOptions": {},
        "displayType": "table",
        "pivotAggregation": null,
        "pivotColumns": null,
        "xColumns": null,
        "yColumns": null
       },
       "removedWidgets": [],
       "schema": [
        {
         "metadata": "{}",
         "name": "model_name",
         "type": "\"string\""
        },
        {
         "metadata": "{}",
         "name": "mean",
         "type": "\"double\""
        },
        {
         "metadata": "{}",
         "name": "ci_lower",
         "type": "\"double\""
        },
        {
         "metadata": "{}",
         "name": "ci_upper",
         "type": "\"double\""
        },
        {
         "metadata": "{}",
         "name": "is_medical",
         "type": "\"boolean\""
        }
       ],
       "type": "table"
      }
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "import json\n",
    "import os\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "import pandas as pd\n",
    "from sklearn.metrics import balanced_accuracy_score\n",
    "from pathlib import Path\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "from pathlib import Path\n",
    "\n",
    "\n",
    "def load_results(results_dir):\n",
    "    # Keep this function as it is, it's working correctly\n",
    "    results = []\n",
    "    for filename in os.listdir(results_dir):\n",
    "        if filename.endswith('.json'):\n",
    "            with open(os.path.join(results_dir, filename), 'r') as f:\n",
    "                result = json.load(f)\n",
    "                # Calculate balanced accuracy\n",
    "                if 'csn_results' in result:\n",
    "                    y_true = [pred['cardiac_arrest'] for pred in result['csn_results']]\n",
    "                    y_pred = [pred['predicted_ihca'] for pred in result['csn_results']]\n",
    "                elif 'predictions' in result:\n",
    "                    y_true = [pred['cardiac_arrest'] for pred in result['predictions']]\n",
    "                    y_pred = [pred['predicted_ihca'] for pred in result['predictions']]\n",
    "                else:\n",
    "                    print(f\"Warning: Unable to calculate balanced accuracy for {filename}. Skipping this file.\")\n",
    "                    continue\n",
    "\n",
    "                balanced_acc = balanced_accuracy_score(y_true, y_pred)\n",
    "                result['metrics']['balanced_accuracy'] = balanced_acc\n",
    "                results.append(result)\n",
    "    return results\n",
    "\n",
    "def bootstrap_ci(data, num_bootstrap_samples=100000, ci=0.95):\n",
    "    bootstrap_means = []\n",
    "    for _ in range(num_bootstrap_samples):\n",
    "        bootstrap_sample = np.random.choice(data, size=len(data), replace=True)\n",
    "        bootstrap_means.append(np.mean(bootstrap_sample))\n",
    "    \n",
    "    ci_lower = np.percentile(bootstrap_means, (1 - ci) / 2 * 100)\n",
    "    ci_upper = np.percentile(bootstrap_means, (1 + ci) / 2 * 100)\n",
    "    \n",
    "    return ci_lower, ci_upper\n",
    "\n",
    "def ensure_plot_dir(base_dir):\n",
    "    plot_dir = Path(base_dir) / \"plots\"\n",
    "    plot_dir.mkdir(parents=True, exist_ok=True)\n",
    "    return plot_dir\n",
    "\n",
    "import seaborn as sns\n",
    "\n",
    "def set_neurips_style():\n",
    "    sns.set_style(\"whitegrid\")\n",
    "    plt.rcParams['font.family'] = 'serif'\n",
    "    plt.rcParams['font.serif'] = ['Times New Roman'] + plt.rcParams['font.serif']\n",
    "    plt.rcParams['font.size'] = 9\n",
    "    plt.rcParams['axes.labelsize'] = 9\n",
    "    plt.rcParams['axes.titlesize'] = 10\n",
    "    plt.rcParams['xtick.labelsize'] = 8\n",
    "    plt.rcParams['ytick.labelsize'] = 5\n",
    "    plt.rcParams['legend.fontsize'] = 8\n",
    "    plt.rcParams['figure.titlesize'] = 12\n",
    "\n",
    "def plot_model_comparisons(results, plot_dir):\n",
    "    set_neurips_style()\n",
    "    \n",
    "    df = pd.DataFrame([(r['model_name'], r['metrics'].get('balanced_accuracy', np.nan), \n",
    "                        r['metrics'].get('precision', np.nan), \n",
    "                        r['metrics'].get('recall', np.nan), \n",
    "                        r['metrics'].get('f1_score', np.nan)) \n",
    "                       for r in results],\n",
    "                      columns=['model_name', 'balanced_accuracy', 'precision', 'recall', 'f1_score'])\n",
    "    \n",
    "    metrics = ['balanced_accuracy', 'precision', 'recall', 'f1_score']\n",
    "    \n",
    "    top_performer_color = '#1f77b4'  # Blue color for top performers\n",
    "    other_model_color = '#A9A9A9'    # Single shade of gray for non-top performers\n",
    "    medical_model_edge_color = 'red'  # Edge color for medical models\n",
    "    \n",
    "    for metric in metrics:\n",
    "        fig, ax = plt.subplots(figsize=(7, 5))\n",
    "        \n",
    "        model_data = []\n",
    "        for model_name in df['model_name'].unique():\n",
    "            model_scores = df[df['model_name'] == model_name][metric].dropna().values\n",
    "            if len(model_scores) > 0:\n",
    "                mean = np.mean(model_scores)\n",
    "                ci_lower, ci_upper = bootstrap_ci(model_scores)\n",
    "                is_medical = 'med' in model_name.lower() or 'bio' in model_name.lower() or 'newmes' in model_name.lower()\n",
    "                model_data.append((model_name, mean, ci_lower, ci_upper, is_medical))\n",
    "        \n",
    "        model_data.sort(key=lambda x: x[1], reverse=True)\n",
    "        \n",
    "        models, means, ci_lowers, ci_uppers, is_medical = zip(*model_data)\n",
    "        \n",
    "        top_performers = models[:5]\n",
    "        bar_colors = [top_performer_color if model in top_performers else other_model_color for model in models]\n",
    "        \n",
    "        y_pos = range(len(models))\n",
    "        bars = ax.barh(y_pos, means, alpha=0.7, color=bar_colors, height=0.6)\n",
    "        \n",
    "        # Add thinner border to medical model bars\n",
    "        for bar, is_med in zip(bars, is_medical):\n",
    "            if is_med:\n",
    "                bar.set_edgecolor(medical_model_edge_color)\n",
    "                bar.set_linewidth(1)  # Reduced from 2 to 1 for thinner bordering\n",
    "        \n",
    "        # Calculate symmetric error and ensure it doesn't go below 0\n",
    "        errors = [min(mean - ci_lower, ci_upper - mean) for mean, ci_lower, ci_upper in zip(means, ci_lowers, ci_uppers)]\n",
    "        errors = [min(error, mean) for error, mean in zip(errors, means)]  # Ensure error doesn't exceed the mean\n",
    "        \n",
    "        # Plot symmetric error bars\n",
    "        ax.errorbar(means, y_pos, xerr=errors, fmt='none', ecolor='black', capsize=3)\n",
    "        \n",
    "        ax.set_title(metric.replace('_', ' ').title(), fontsize=10)\n",
    "        ax.set_xlabel(metric.replace('_', ' ').title(), fontsize=9)\n",
    "        ax.set_ylabel('Model', fontsize=9)\n",
    "        \n",
    "        # Set y-ticks and labels explicitly\n",
    "        ax.set_yticks(y_pos)\n",
    "        ax.set_yticklabels(models)\n",
    "        \n",
    "        # Customize y-axis labels\n",
    "        labels = ax.get_yticklabels()\n",
    "        for i, label in enumerate(labels):\n",
    "            if models[i] in top_performers:\n",
    "                label.set_fontsize(6)\n",
    "                label.set_fontweight('bold')\n",
    "            else:\n",
    "                label.set_fontsize(5)\n",
    "                label.set_alpha(0.9)\n",
    "        \n",
    "        # Adjust layout to give more space to bars\n",
    "        plt.subplots_adjust(left=0.4)\n",
    "        \n",
    "        for j, (model, mean, ci_lower, ci_upper, _) in enumerate(model_data):\n",
    "            error = min(mean - ci_lower, ci_upper - mean)\n",
    "            error = min(error, mean)  # Ensure error doesn't exceed the mean\n",
    "            if model in top_performers:\n",
    "                ax.text(mean + error + 0.02, j, f'{mean:.2f}±{error:.2f}', va='center', fontsize=6, fontweight='bold')\n",
    "            else:\n",
    "                ax.text(mean + error + 0.02, j, f'{mean:.2f}±{error:.2f}', va='center', fontsize=5, alpha=0.7)\n",
    "        \n",
    "        ax.axvline(x=0.5, color='red', linestyle='--', linewidth=1)\n",
    "        ax.text(0.51, ax.get_ylim()[1], 'Chance level', rotation=90, va='top', ha='left', color='red', fontsize=7)\n",
    "        \n",
    "        ax.set_xlim(0, 1.1)\n",
    "        ax.tick_params(axis='x', which='major', labelsize=8)\n",
    "        \n",
    "        # Add a legend in the top right corner\n",
    "        top_performer_patch = plt.Rectangle((0, 0), 1, 1, fc=top_performer_color, alpha=0.7)\n",
    "        other_patch = plt.Rectangle((0, 0), 1, 1, fc=other_model_color, alpha=0.7)\n",
    "        medical_patch = plt.Rectangle((0, 0), 1, 1, fc='white', ec=medical_model_edge_color, lw=1)\n",
    "        ax.legend([top_performer_patch, other_patch, medical_patch], \n",
    "                  ['Top 5 Performers', 'Other Models', 'Medical Models'], \n",
    "                  loc='upper right', fontsize=6, bbox_to_anchor=(1, 1), bbox_transform=ax.transAxes)\n",
    "        \n",
    "        plt.tight_layout()\n",
    "        \n",
    "        # Save the plot in both PNG and PDF formats\n",
    "        for format in ['png', 'pdf']:\n",
    "            plot_path = plot_dir / f'{metric}_comparison.{format}'\n",
    "            plt.savefig(plot_path, format=format, dpi=300, bbox_inches='tight')\n",
    "            print(f\"{metric.capitalize()} plot saved to: {plot_path}\")\n",
    "        \n",
    "        plt.close(fig)\n",
    "\n",
    "    return pd.DataFrame(model_data, columns=['model_name', 'mean', 'ci_lower', 'ci_upper', 'is_medical'])\n",
    "\n",
    "BASE_DIR = \"/Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/\"\n",
    "RESULTS_DIR = os.path.join(BASE_DIR, \"model_results\")\n",
    "PLOT_DIR = ensure_plot_dir(BASE_DIR)\n",
    "results = load_results(RESULTS_DIR)\n",
    "summary_df = plot_model_comparisons(results, PLOT_DIR)\n",
    "\n",
    "# Display the summary DataFrame\n",
    "display(summary_df)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {},
     "inputWidgets": {},
     "nuid": "e575db1b-59cb-43fe-8642-e19f233dc753",
     "showTitle": false,
     "title": ""
    }
   },
   "source": [
    "## Other plots (ROC Curve, Precision-Recall Curve, Error Rates)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "c04a5e33-861d-4533-9640-ba45382b2617",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Plots have been saved in the directory: /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/plots\n"
     ]
    }
   ],
   "source": [
    "import json\n",
    "import os\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "from sklearn.metrics import roc_curve, auc, precision_recall_curve, average_precision_score\n",
    "from collections import defaultdict\n",
    "import matplotlib.cm as cm\n",
    "import seaborn as sns\n",
    "\n",
    "def set_neurips_style():\n",
    "    sns.set_style(\"whitegrid\")\n",
    "    plt.rcParams['font.family'] = 'serif'\n",
    "    plt.rcParams['font.serif'] = ['Times New Roman'] + plt.rcParams['font.serif']\n",
    "    plt.rcParams['font.size'] = 9\n",
    "    plt.rcParams['axes.labelsize'] = 9\n",
    "    plt.rcParams['axes.titlesize'] = 10\n",
    "    plt.rcParams['xtick.labelsize'] = 8\n",
    "    plt.rcParams['ytick.labelsize'] = 8\n",
    "    plt.rcParams['legend.fontsize'] = 8\n",
    "    plt.rcParams['figure.titlesize'] = 12\n",
    "\n",
    "def load_results(results_dir):\n",
    "    results = defaultdict(list)\n",
    "    for filename in os.listdir(results_dir):\n",
    "        if filename.endswith('.json'):\n",
    "            with open(os.path.join(results_dir, filename), 'r') as f:\n",
    "                result = json.load(f)\n",
    "                model_name = result['model_name']\n",
    "                results[model_name].append(result)\n",
    "    return results\n",
    "\n",
    "def get_best_result(model_results):\n",
    "    return max(model_results, key=lambda x: x['metrics'].get('f1_score', 0))\n",
    "\n",
    "def ensure_plot_dir(base_dir):\n",
    "    plot_dir = os.path.join(base_dir, \"plots\")\n",
    "    os.makedirs(plot_dir, exist_ok=True)\n",
    "    return plot_dir\n",
    "\n",
    "def get_confusion_matrix_values(confusion_matrix):\n",
    "    if isinstance(confusion_matrix[0], list):  # 2x2 matrix\n",
    "        [[tn, fp], [fn, tp]] = confusion_matrix\n",
    "    elif len(confusion_matrix) == 4:  # Flat list\n",
    "        tn, fp, fn, tp = confusion_matrix\n",
    "    else:\n",
    "        raise ValueError(\"Unexpected confusion matrix format\")\n",
    "    return tn, fp, fn, tp\n",
    "\n",
    "\n",
    "\n",
    "def create_bottom_legend(ax, handles, labels, medical_models, top_performers, num_cols=3):\n",
    "    \"\"\"Create a legend at the bottom of the plot with all medical models and top performers.\"\"\"\n",
    "    # Separate medical models and top performers\n",
    "    medical_handles = [h for h, l in zip(handles, labels) if any(med in l for med in medical_models)]\n",
    "    medical_labels = [l for l in labels if any(med in l for med in medical_models)]\n",
    "    \n",
    "    top_handles = [h for h, l in zip(handles, labels) if any(top in l for top in top_performers)]\n",
    "    top_labels = [l for l in labels if any(top in l for top in top_performers)]\n",
    "    \n",
    "    # Combine medical models and top performers, removing duplicates\n",
    "    legend_handles = list(dict.fromkeys(medical_handles + top_handles))\n",
    "    legend_labels = list(dict.fromkeys(medical_labels + top_labels))\n",
    "    \n",
    "    # Sort by performance (assuming it's the last number in parentheses)\n",
    "    sorted_items = sorted(zip(legend_handles, legend_labels), \n",
    "                          key=lambda x: float(x[1].split('=')[-1].strip()[:-1]),\n",
    "                          reverse=True)\n",
    "    \n",
    "    legend_handles, legend_labels = zip(*sorted_items)\n",
    "    \n",
    "    # Create the legend\n",
    "    ax.legend(legend_handles, legend_labels, loc='upper center', bbox_to_anchor=(0.5, -0.15),\n",
    "              ncol=num_cols, fontsize=8)\n",
    "\n",
    "def plot_roc_curves(results, plot_dir):\n",
    "    set_neurips_style()\n",
    "    plt.figure(figsize=(12, 8))\n",
    "    \n",
    "    model_aucs = []\n",
    "    for model_name, model_results in results.items():\n",
    "        best_result = get_best_result(model_results)\n",
    "        try:\n",
    "            tn, fp, fn, tp = get_confusion_matrix_values(best_result['confusion_matrix'])\n",
    "            y_true = [0] * (tn + fp) + [1] * (fn + tp)\n",
    "            y_scores = [0] * tn + [1] * fp + [0] * fn + [1] * tp\n",
    "            fpr, tpr, _ = roc_curve(y_true, y_scores)\n",
    "            roc_auc = auc(fpr, tpr)\n",
    "            is_medical = 'med' in model_name.lower() or 'bio' in model_name.lower()\n",
    "            model_aucs.append((model_name, roc_auc, fpr, tpr, is_medical))\n",
    "        except Exception as e:\n",
    "            print(f\"Error processing {model_name}: {str(e)}\")\n",
    "    \n",
    "    model_aucs.sort(key=lambda x: x[1], reverse=True)\n",
    "    \n",
    "    medical_models = [m[0] for m in model_aucs if m[4]]\n",
    "    non_medical_models = [m for m in model_aucs if not m[4]]\n",
    "    \n",
    "    # Plot non-medical models\n",
    "    top_colors = cm.rainbow(np.linspace(0, 1, 5))\n",
    "    for i, (model_name, roc_auc, fpr, tpr, _) in enumerate(non_medical_models[:5]):\n",
    "        plt.plot(fpr, tpr, label=f'{model_name} (AUC={roc_auc:.2f})', \n",
    "                 color=top_colors[i], linestyle='-', linewidth=2, alpha=0.8)\n",
    "    \n",
    "    # Plot other non-medical models\n",
    "    for model_name, roc_auc, fpr, tpr, _ in non_medical_models[5:]:\n",
    "        plt.plot(fpr, tpr, label=f'{model_name} (AUC={roc_auc:.2f})',\n",
    "                 color='lightgray', linestyle='-', linewidth=1, alpha=0.3)\n",
    "    \n",
    "    # Plot medical models with a color gradient\n",
    "    num_medical = len(medical_models)\n",
    "    medical_colors = cm.viridis(np.linspace(0, 1, num_medical))\n",
    "    for i, (model_name, roc_auc, fpr, tpr, _) in enumerate([m for m in model_aucs if m[4]]):\n",
    "        plt.plot(fpr, tpr, label=f'{model_name} (AUC={roc_auc:.2f})', \n",
    "                 color=medical_colors[i], linestyle='--', linewidth=1.5, alpha=0.7)\n",
    "\n",
    "    plt.plot([0, 1], [0, 1], color='navy', linestyle='--', label='Chance')\n",
    "    plt.xlim([0.0, 1.0])\n",
    "    plt.ylim([0.0, 1.05])\n",
    "    plt.xlabel('False Positive Rate')\n",
    "    plt.ylabel('True Positive Rate')\n",
    "    plt.title('Receiver Operating Characteristic (ROC) Curve')\n",
    "    \n",
    "    # Create bottom legend\n",
    "    handles, labels = plt.gca().get_legend_handles_labels()\n",
    "    top_performers = [m[0] for m in model_aucs[:5]]\n",
    "    create_bottom_legend(plt.gca(), handles, labels, medical_models, top_performers)\n",
    "    \n",
    "    plt.tight_layout()\n",
    "    plt.savefig(os.path.join(plot_dir, 'roc_curves.pdf'), dpi=300, bbox_inches='tight')\n",
    "    plt.savefig(os.path.join(plot_dir, 'roc_curves.png'), dpi=300, bbox_inches='tight')\n",
    "    plt.close()\n",
    "\n",
    "def plot_precision_recall_curves(results, plot_dir):\n",
    "    set_neurips_style()\n",
    "    plt.figure(figsize=(12, 8))\n",
    "    \n",
    "    model_aps = []\n",
    "    for model_name, model_results in results.items():\n",
    "        best_result = get_best_result(model_results)\n",
    "        try:\n",
    "            tn, fp, fn, tp = get_confusion_matrix_values(best_result['confusion_matrix'])\n",
    "            y_true = [0] * (tn + fp) + [1] * (fn + tp)\n",
    "            y_scores = [0] * tn + [1] * fp + [0] * fn + [1] * tp\n",
    "            precision, recall, _ = precision_recall_curve(y_true, y_scores)\n",
    "            average_precision = average_precision_score(y_true, y_scores)\n",
    "            is_medical = 'med' in model_name.lower() or 'bio' in model_name.lower()\n",
    "            model_aps.append((model_name, average_precision, recall, precision, is_medical))\n",
    "        except Exception as e:\n",
    "            print(f\"Error processing {model_name}: {str(e)}\")\n",
    "    \n",
    "    model_aps.sort(key=lambda x: x[1], reverse=True)\n",
    "    \n",
    "    medical_models = [m[0] for m in model_aps if m[4]]\n",
    "    non_medical_models = [m for m in model_aps if not m[4]]\n",
    "    \n",
    "    # Plot non-medical models\n",
    "    top_colors = cm.rainbow(np.linspace(0, 1, 5))\n",
    "    for i, (model_name, ap, recall, precision, _) in enumerate(non_medical_models[:5]):\n",
    "        plt.plot(recall, precision, label=f'{model_name} (AP={ap:.2f})', \n",
    "                 color=top_colors[i], linestyle='-', linewidth=2, alpha=0.8)\n",
    "    \n",
    "    # Plot other non-medical models\n",
    "    for model_name, ap, recall, precision, _ in non_medical_models[5:]:\n",
    "        plt.plot(recall, precision, label=f'{model_name} (AP={ap:.2f})',\n",
    "                 color='lightgray', linestyle='-', linewidth=1, alpha=0.3)\n",
    "    \n",
    "    # Plot medical models with a color gradient\n",
    "    num_medical = len(medical_models)\n",
    "    medical_colors = cm.viridis(np.linspace(0, 1, num_medical))\n",
    "    for i, (model_name, ap, recall, precision, _) in enumerate([m for m in model_aps if m[4]]):\n",
    "        plt.plot(recall, precision, label=f'{model_name} (AP={ap:.2f})', \n",
    "                 color=medical_colors[i], linestyle='--', linewidth=1.5, alpha=0.7)\n",
    "\n",
    "    plt.xlim([0.0, 1.0])\n",
    "    plt.ylim([0.0, 1.05])\n",
    "    plt.xlabel('Recall')\n",
    "    plt.ylabel('Precision')\n",
    "    plt.title('Precision-Recall Curve')\n",
    "    \n",
    "    # Create bottom legend\n",
    "    handles, labels = plt.gca().get_legend_handles_labels()\n",
    "    top_performers = [m[0] for m in model_aps[:5]]\n",
    "    create_bottom_legend(plt.gca(), handles, labels, medical_models, top_performers)\n",
    "    \n",
    "    plt.tight_layout()\n",
    "    plt.savefig(os.path.join(plot_dir, 'precision_recall_curves.pdf'), dpi=300, bbox_inches='tight')\n",
    "    plt.savefig(os.path.join(plot_dir, 'precision_recall_curves.png'), dpi=300, bbox_inches='tight')\n",
    "    plt.close()\n",
    "\n",
    "def plot_error_rates(results, plot_dir):\n",
    "    set_neurips_style()\n",
    "    model_data = []\n",
    "\n",
    "    for model_name, model_results in results.items():\n",
    "        best_result = get_best_result(model_results)\n",
    "        try:\n",
    "            tn, fp, fn, tp = get_confusion_matrix_values(best_result['confusion_matrix'])\n",
    "            total = tn + fp + fn + tp\n",
    "            f1_score = best_result['metrics'].get('f1_score', 0)\n",
    "            is_medical = 'med' in model_name.lower() or 'bio' in model_name.lower()\n",
    "            model_data.append((model_name, tn/total, fp/total, fn/total, tp/total, f1_score, is_medical))\n",
    "        except Exception as e:\n",
    "            print(f\"Error processing {model_name}: {str(e)}\")\n",
    "\n",
    "    model_data.sort(key=lambda x: x[5], reverse=True)  # Sort by F1 score\n",
    "    \n",
    "    # Separate medical and non-medical models\n",
    "    medical_models = [m for m in model_data if m[6]]\n",
    "    non_medical_models = [m for m in model_data if not m[6]]\n",
    "    \n",
    "    # Select all medical models and top 5 non-medical models\n",
    "    top_models = non_medical_models[:5] + medical_models\n",
    "    \n",
    "    model_names, tn_rates, fp_rates, fn_rates, tp_rates, _, is_medical = zip(*top_models)\n",
    "\n",
    "    fig, ax = plt.subplots(figsize=(12, 10))\n",
    "    bar_height = 0.8\n",
    "    y_positions = range(len(model_names))\n",
    "    \n",
    "    bottom = np.zeros(len(model_names))\n",
    "    for rates, label, color in zip([tn_rates, fp_rates, fn_rates, tp_rates], \n",
    "                                   ['True Negative', 'False Positive', 'False Negative', 'True Positive'],\n",
    "                                   ['#2ca02c', '#ff7f0e', '#d62728', '#1f77b4']):\n",
    "        ax.barh(y_positions, rates, left=bottom, label=label, color=color, height=bar_height)\n",
    "        bottom += rates\n",
    "\n",
    "    ax.set_title('Error Rate Comparison')\n",
    "    ax.legend(loc='upper center', bbox_to_anchor=(0.5, -0.05), ncol=4)\n",
    "    ax.set_xlabel('Proportion')\n",
    "    ax.set_yticks(y_positions)\n",
    "    ax.set_yticklabels(model_names)\n",
    "    ax.set_xlim(0, 1)\n",
    "    \n",
    "    # Customize y-axis labels\n",
    "    labels = ax.get_yticklabels()\n",
    "    for i, label in enumerate(labels):\n",
    "        if is_medical[i]:\n",
    "            label.set_color('darkblue')\n",
    "        if i < 5:  # Top 5 non-medical models\n",
    "            label.set_fontweight('bold')\n",
    "    \n",
    "    ax.set_yticklabels(labels)\n",
    "    \n",
    "    plt.tight_layout()\n",
    "    plt.savefig(os.path.join(plot_dir, 'error_rates.pdf'), dpi=300, bbox_inches='tight')\n",
    "    plt.savefig(os.path.join(plot_dir, 'error_rates.png'), dpi=300, bbox_inches='tight')\n",
    "    plt.close()\n",
    "\n",
    "\n",
    "# Main execution\n",
    "if __name__ == \"__main__\":\n",
    "    BASE_DIR = \"/Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/\"\n",
    "    RESULTS_DIR = os.path.join(BASE_DIR, \"model_results\")\n",
    "    results = load_results(RESULTS_DIR)\n",
    "\n",
    "    # Ensure plot directory exists\n",
    "    PLOT_DIR = ensure_plot_dir(BASE_DIR)\n",
    "\n",
    "    # Generate and save plots\n",
    "    plot_roc_curves(results, PLOT_DIR)\n",
    "    plot_precision_recall_curves(results, PLOT_DIR)\n",
    "    plot_error_rates(results, PLOT_DIR)\n",
    "\n",
    "    print(f\"Plots have been saved in the directory: {PLOT_DIR}\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {},
     "inputWidgets": {},
     "nuid": "2d2a7ec5-0e42-46e4-bc10-28abc6d65454",
     "showTitle": false,
     "title": ""
    }
   },
   "source": [
    "## Plots for instruction following"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "7711efb3-924b-40e3-9b68-a38100b2ae24",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Instruction following performance plot saved in: /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/plots\n"
     ]
    }
   ],
   "source": [
    "import json\n",
    "import os\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "\n",
    "def set_neurips_style():\n",
    "    sns.set_style(\"whitegrid\")\n",
    "    plt.rcParams['font.family'] = 'serif'\n",
    "    plt.rcParams['font.serif'] = ['Times New Roman'] + plt.rcParams['font.serif']\n",
    "    plt.rcParams['font.size'] = 9\n",
    "    plt.rcParams['axes.labelsize'] = 9\n",
    "    plt.rcParams['axes.titlesize'] = 10\n",
    "    plt.rcParams['xtick.labelsize'] = 8\n",
    "    plt.rcParams['ytick.labelsize'] = 7\n",
    "    plt.rcParams['legend.fontsize'] = 8\n",
    "    plt.rcParams['figure.titlesize'] = 12\n",
    "\n",
    "def analyze_instruction_following(results_dir):\n",
    "    instruction_following_scores = {}\n",
    "    instruction_following_scores = {k: v for k, v in instruction_following_scores.items() if 'GPT-4o' not in k}\n",
    "\n",
    "    \n",
    "    for filename in os.listdir(results_dir):\n",
    "        if filename.endswith('.json'):\n",
    "            with open(os.path.join(results_dir, filename), 'r') as f:\n",
    "                result = json.load(f)\n",
    "                model_name = result['model_name']\n",
    "                predictions = result['predictions']\n",
    "                \n",
    "                correct_responses = 0\n",
    "                total_responses = len(predictions)\n",
    "                \n",
    "                for pred in predictions:\n",
    "                    rationale = pred['rationale'].lower().strip()\n",
    "                    words = rationale.split()\n",
    "                    if len(words) >= 1 and words[0] in ['positive', 'negative']:\n",
    "                        correct_responses += 1\n",
    "                    elif len(words) >= 5 and ('positive' in words[:5] or 'negative' in words[:5]):\n",
    "                        correct_responses += 1\n",
    "                \n",
    "                instruction_following_score = correct_responses / total_responses\n",
    "                instruction_following_scores[model_name] = instruction_following_score\n",
    "    \n",
    "    return instruction_following_scores\n",
    "\n",
    "def plot_instruction_following(instruction_following_scores, plot_dir):\n",
    "    set_neurips_style()\n",
    "    \n",
    "    # Sort models by score\n",
    "    sorted_data = sorted(instruction_following_scores.items(), key=lambda x: x[1], reverse=True)\n",
    "    models, scores = zip(*sorted_data)\n",
    "    \n",
    "    fig, ax = plt.subplots(figsize=(20, 10))\n",
    "    \n",
    "    # Create bars\n",
    "    bars = ax.bar(range(len(models)), [score * 100 for score in scores], width=0.8)\n",
    "    \n",
    "    # Color the bars based on whether the model is medical or not\n",
    "    for i, model in enumerate(models):\n",
    "        if 'med' in model.lower():\n",
    "            bars[i].set_color('darkblue')\n",
    "        else:\n",
    "            bars[i].set_color('lightblue')\n",
    "    \n",
    "    ax.set_xlabel('Models', fontsize=12)\n",
    "    ax.set_ylabel('Instruction Following Score (%)', fontsize=12)\n",
    "    ax.set_title('Instruction Following Performance of Models', fontsize=14)\n",
    "    ax.set_xticks(range(len(models)))\n",
    "    ax.set_xticklabels(models, rotation=90, ha='right', fontsize=8)\n",
    "    ax.set_ylim(0, 100)\n",
    "    \n",
    "    # Add gridlines\n",
    "    ax.yaxis.grid(True, linestyle='--', alpha=0.7)\n",
    "    \n",
    "    # Add percentage labels on top of each bar\n",
    "    for i, v in enumerate(scores):\n",
    "        ax.text(i, v*100 + 1, f'{v*100:.1f}%', ha='center', va='bottom', fontsize=8, rotation=90)\n",
    "    \n",
    "    # Create legend\n",
    "    from matplotlib.patches import Patch\n",
    "    legend_elements = [Patch(facecolor='lightblue', edgecolor='lightblue', label='Non-medical Models'),\n",
    "                       Patch(facecolor='darkblue', edgecolor='darkblue', label='Medical Models')]\n",
    "    ax.legend(handles=legend_elements, loc='upper right', fontsize=10)\n",
    "    \n",
    "    plt.tight_layout()\n",
    "    plt.savefig(os.path.join(plot_dir, 'instruction_following_performance.pdf'), dpi=300, bbox_inches='tight')\n",
    "    plt.savefig(os.path.join(plot_dir, 'instruction_following_performance.png'), dpi=300, bbox_inches='tight')\n",
    "    plt.close(fig)\n",
    "\n",
    "\n",
    "# Add this to your main execution block\n",
    "if __name__ == \"__main__\":\n",
    "    BASE_DIR = \"/Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/\"\n",
    "    RESULTS_DIR = os.path.join(BASE_DIR, \"model_results\")\n",
    "    PLOT_DIR = ensure_plot_dir(BASE_DIR)\n",
    "    \n",
    "    # Analyze instruction following\n",
    "    instruction_following_scores = analyze_instruction_following(RESULTS_DIR)\n",
    "    \n",
    "    # Plot instruction following performance\n",
    "    plot_instruction_following(instruction_following_scores, PLOT_DIR)\n",
    "    \n",
    "    print(f\"Instruction following performance plot saved in: {PLOT_DIR}\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {},
     "inputWidgets": {},
     "nuid": "3f295c7b-d363-415e-95c2-7887a6787e0d",
     "showTitle": false,
     "title": ""
    }
   },
   "source": [
    "## Plots for instruction following -2-"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "0a00ac1a-8ec6-4bac-b903-7f2d17554422",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/root/.ipykernel/2724/command-791695761639634-520722811:48: DeprecationWarning: 'binom_test' is deprecated in favour of 'binomtest' from version 1.7.0 and will be removed in Scipy 1.12.0.\n  p_value = stats.binom_test(f1_score * sample_size, sample_size, p=chance_level, alternative='greater')\n"
     ]
    },
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Significant models instruction following performance plot saved in: /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/plots\n"
     ]
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "import numpy as np\n",
    "import os\n",
    "import json\n",
    "from scipy import stats\n",
    "\n",
    "def set_neurips_style():\n",
    "    sns.set_style(\"whitegrid\")\n",
    "    plt.rcParams['font.family'] = 'serif'\n",
    "    plt.rcParams['font.serif'] = ['Times New Roman'] + plt.rcParams['font.serif']\n",
    "    plt.rcParams['font.size'] = 9\n",
    "    plt.rcParams['axes.labelsize'] = 9\n",
    "    plt.rcParams['axes.titlesize'] = 10\n",
    "    plt.rcParams['xtick.labelsize'] = 8\n",
    "    plt.rcParams['ytick.labelsize'] = 7\n",
    "    plt.rcParams['legend.fontsize'] = 8\n",
    "    plt.rcParams['figure.titlesize'] = 12\n",
    "\n",
    "def load_results_with_f1(results_dir):\n",
    "    results = {}\n",
    "    for filename in os.listdir(results_dir):\n",
    "        if filename.endswith('.json'):\n",
    "            with open(os.path.join(results_dir, filename), 'r') as f:\n",
    "                result = json.load(f)\n",
    "                model_name = result['model_name']\n",
    "                f1_score = result['metrics'].get('f1_score', 0)\n",
    "                instruction_following_score = calculate_instruction_following(result['predictions'])\n",
    "                results[model_name] = {'f1_score': f1_score, 'instruction_following': instruction_following_score}\n",
    "    return results\n",
    "\n",
    "def calculate_instruction_following(predictions):\n",
    "    correct_responses = 0\n",
    "    total_responses = len(predictions)\n",
    "    for pred in predictions:\n",
    "        rationale = pred['rationale'].lower().strip()\n",
    "        words = rationale.split()\n",
    "        if len(words) >= 1 and words[0] in ['positive', 'negative']:\n",
    "            correct_responses += 1\n",
    "        elif len(words) >= 5 and ('positive' in words[:5] or 'negative' in words[:5]):\n",
    "            correct_responses += 1\n",
    "    return correct_responses / total_responses\n",
    "\n",
    "def is_f1_significant(f1_score, sample_size, p_value_threshold=0.05):\n",
    "    # Assuming chance level is 0.5\n",
    "    chance_level = 0.5\n",
    "    # Perform a one-sided binomial test\n",
    "    p_value = stats.binom_test(f1_score * sample_size, sample_size, p=chance_level, alternative='greater')\n",
    "    return p_value < p_value_threshold\n",
    "\n",
    "def plot_significant_models(results, plot_dir, sample_size=1000):\n",
    "    set_neurips_style()\n",
    "    \n",
    "    # Filter out GPT-4o and insignificant models\n",
    "    significant_results = {k: v for k, v in results.items() \n",
    "                           if 'GPT-4o' not in k and is_f1_significant(v['f1_score'], sample_size)}\n",
    "    \n",
    "    # Sort models by instruction following score\n",
    "    sorted_data = sorted(significant_results.items(), key=lambda x: x[1]['instruction_following'], reverse=True)\n",
    "    models, data = zip(*sorted_data)\n",
    "    \n",
    "    fig, ax = plt.subplots(figsize=(20, 10))\n",
    "    \n",
    "    # Create bars for instruction following scores\n",
    "    bars = ax.bar(range(len(models)), [d['instruction_following'] * 100 for d in data], width=0.8)\n",
    "    \n",
    "    # Color the bars based on whether the model is medical or not\n",
    "    for i, model in enumerate(models):\n",
    "        if 'med' in model.lower():\n",
    "            bars[i].set_color('darkblue')\n",
    "        else:\n",
    "            bars[i].set_color('lightblue')\n",
    "    \n",
    "    ax.set_xlabel('Models', fontsize=12)\n",
    "    ax.set_ylabel('Instruction Following Score (%)', fontsize=12)\n",
    "    ax.set_title('Instruction Following Performance of Significant Models', fontsize=14)\n",
    "    ax.set_xticks(range(len(models)))\n",
    "    ax.set_xticklabels(models, rotation=90, ha='right', fontsize=8)\n",
    "    ax.set_ylim(0, 100)\n",
    "    \n",
    "    # Add gridlines\n",
    "    ax.yaxis.grid(True, linestyle='--', alpha=0.7)\n",
    "    \n",
    "    # Add percentage labels on top of each bar\n",
    "    for i, d in enumerate(data):\n",
    "        ax.text(i, d['instruction_following']*100 + 1, f'{d[\"instruction_following\"]*100:.1f}%', \n",
    "                ha='center', va='bottom', fontsize=8, rotation=90)\n",
    "    \n",
    "    # Create legend\n",
    "    from matplotlib.patches import Patch\n",
    "    legend_elements = [Patch(facecolor='lightblue', edgecolor='lightblue', label='Non-medical Models'),\n",
    "                       Patch(facecolor='darkblue', edgecolor='darkblue', label='Medical Models')]\n",
    "    ax.legend(handles=legend_elements, loc='upper right', fontsize=10)\n",
    "    \n",
    "    plt.tight_layout()\n",
    "    plt.savefig(os.path.join(plot_dir, 'significant_instruction_following_performance.pdf'), dpi=300, bbox_inches='tight')\n",
    "    plt.savefig(os.path.join(plot_dir, 'significant_instruction_following_performance.png'), dpi=300, bbox_inches='tight')\n",
    "    plt.close(fig)\n",
    "\n",
    "# Main execution\n",
    "if __name__ == \"__main__\":\n",
    "    BASE_DIR = \"/Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/\"\n",
    "    RESULTS_DIR = os.path.join(BASE_DIR, \"model_results\")\n",
    "    PLOT_DIR = ensure_plot_dir(BASE_DIR)\n",
    "    \n",
    "    # Load results with F1 scores and instruction following scores\n",
    "    results = load_results_with_f1(RESULTS_DIR)\n",
    "    \n",
    "    # Plot instruction following performance for significant models\n",
    "    plot_significant_models(results, PLOT_DIR)\n",
    "    \n",
    "    print(f\"Significant models instruction following performance plot saved in: {PLOT_DIR}\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {},
     "inputWidgets": {},
     "nuid": "397c63bf-eff4-4a26-a978-69a0a61a4a86",
     "showTitle": false,
     "title": ""
    }
   },
   "source": [
    "## Plots for instruction following and F1 score (composite)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "beee436b-86e8-4614-8538-b76efb1c6eaa",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/root/.ipykernel/2724/command-791695761639635-3417486105:46: DeprecationWarning: 'binom_test' is deprecated in favour of 'binomtest' from version 1.7.0 and will be removed in Scipy 1.12.0.\n  p_value = stats.binom_test(f1_score * sample_size, sample_size, p=chance_level, alternative='greater')\n"
     ]
    },
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Top 10 significant models instruction following performance plot saved in: /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/plots\n"
     ]
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "import numpy as np\n",
    "import os\n",
    "import json\n",
    "from scipy import stats\n",
    "\n",
    "def set_neurips_style():\n",
    "    sns.set_style(\"whitegrid\")\n",
    "    plt.rcParams['font.family'] = 'serif'\n",
    "    plt.rcParams['font.serif'] = ['Times New Roman'] + plt.rcParams['font.serif']\n",
    "    plt.rcParams['font.size'] = 9\n",
    "    plt.rcParams['axes.labelsize'] = 9\n",
    "    plt.rcParams['axes.titlesize'] = 10\n",
    "    plt.rcParams['xtick.labelsize'] = 8\n",
    "    plt.rcParams['ytick.labelsize'] = 8\n",
    "    plt.rcParams['legend.fontsize'] = 8\n",
    "    plt.rcParams['figure.titlesize'] = 12\n",
    "\n",
    "def load_results_with_f1(results_dir):\n",
    "    results = {}\n",
    "    for filename in os.listdir(results_dir):\n",
    "        if filename.endswith('.json'):\n",
    "            with open(os.path.join(results_dir, filename), 'r') as f:\n",
    "                result = json.load(f)\n",
    "                model_name = result['model_name']\n",
    "                f1_score = result['metrics'].get('f1_score', 0)\n",
    "                instruction_following_score = calculate_instruction_following(result['predictions'])\n",
    "                results[model_name] = {'f1_score': f1_score, 'instruction_following': instruction_following_score}\n",
    "    return results\n",
    "\n",
    "def calculate_instruction_following(predictions):\n",
    "    correct_responses = 0\n",
    "    total_responses = len(predictions)\n",
    "    for pred in predictions:\n",
    "        rationale = pred['rationale'].lower().strip()\n",
    "        words = rationale.split()\n",
    "        if len(words) >= 1 and words[0] in ['positive', 'negative']:\n",
    "            correct_responses += 1\n",
    "        elif len(words) >= 5 and ('positive' in words[:5] or 'negative' in words[:5]):\n",
    "            correct_responses += 1\n",
    "    return correct_responses / total_responses\n",
    "\n",
    "def is_f1_significant(f1_score, sample_size, p_value_threshold=0.05):\n",
    "    chance_level = 0.5\n",
    "    p_value = stats.binom_test(f1_score * sample_size, sample_size, p=chance_level, alternative='greater')\n",
    "    return p_value < p_value_threshold\n",
    "\n",
    "def plot_top_10_significant_models(results, plot_dir, sample_size=1000):\n",
    "    set_neurips_style()\n",
    "    \n",
    "    # Filter out GPT-4o and insignificant models\n",
    "    significant_results = {k: v for k, v in results.items() \n",
    "                           if 'GPT-4o' not in k and is_f1_significant(v['f1_score'], sample_size)}\n",
    "    \n",
    "    # Sort models by instruction following score and select top 10\n",
    "    sorted_data = sorted(significant_results.items(), key=lambda x: x[1]['instruction_following'], reverse=True)[:10]\n",
    "    models, data = zip(*sorted_data)\n",
    "    \n",
    "    fig, ax = plt.subplots(figsize=(15, 8))\n",
    "    \n",
    "    # Create bars for instruction following scores\n",
    "    bars = ax.bar(range(len(models)), [d['instruction_following'] * 100 for d in data], width=0.6)\n",
    "    \n",
    "    # Color the bars based on whether the model is medical or not\n",
    "    for i, model in enumerate(models):\n",
    "        if 'med' in model.lower():\n",
    "            bars[i].set_color('darkblue')\n",
    "        else:\n",
    "            bars[i].set_color('lightblue')\n",
    "    \n",
    "    ax.set_xlabel('Models', fontsize=12)\n",
    "    ax.set_ylabel('Instruction Following Score (%)', fontsize=12)\n",
    "    ax.set_title('Instruction Following Performance of Top 10 Significant Models', fontsize=14)\n",
    "    ax.set_xticks(range(len(models)))\n",
    "    ax.set_xticklabels(models, rotation=45, ha='right', fontsize=10)\n",
    "    ax.set_ylim(0, 100)\n",
    "    \n",
    "    # Add gridlines\n",
    "    ax.yaxis.grid(True, linestyle='--', alpha=0.7)\n",
    "    \n",
    "    # Add percentage labels on top of each bar\n",
    "    for i, d in enumerate(data):\n",
    "        ax.text(i, d['instruction_following']*100 + 1, f'{d[\"instruction_following\"]*100:.1f}%', \n",
    "                ha='center', va='bottom', fontsize=10)\n",
    "    \n",
    "    # Create legend\n",
    "    from matplotlib.patches import Patch\n",
    "    legend_elements = [Patch(facecolor='lightblue', edgecolor='lightblue', label='Non-medical Models'),\n",
    "                       Patch(facecolor='darkblue', edgecolor='darkblue', label='Medical Models')]\n",
    "    ax.legend(handles=legend_elements, loc='lower left', fontsize=10)\n",
    "    \n",
    "    plt.tight_layout()\n",
    "    plt.savefig(os.path.join(plot_dir, 'top_10_significant_instruction_following_performance.pdf'), dpi=300, bbox_inches='tight')\n",
    "    plt.savefig(os.path.join(plot_dir, 'top_10_significant_instruction_following_performance.png'), dpi=300, bbox_inches='tight')\n",
    "    plt.close(fig)\n",
    "\n",
    "# Main execution\n",
    "if __name__ == \"__main__\":\n",
    "    BASE_DIR = \"/Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/\"\n",
    "    RESULTS_DIR = os.path.join(BASE_DIR, \"model_results\")\n",
    "    PLOT_DIR = ensure_plot_dir(BASE_DIR)\n",
    "    \n",
    "    # Load results with F1 scores and instruction following scores\n",
    "    results = load_results_with_f1(RESULTS_DIR)\n",
    "    \n",
    "    # Plot instruction following performance for top 10 significant models\n",
    "    plot_top_10_significant_models(results, PLOT_DIR)\n",
    "    \n",
    "    print(f\"Top 10 significant models instruction following performance plot saved in: {PLOT_DIR}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "90009a9c-7899-4291-83cb-31778e09f21e",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\u001B[43mNote: you may need to restart the kernel using dbutils.library.restartPython() to use updated packages.\u001B[0m\nCollecting adjustText\n  Downloading adjustText-1.2.0-py3-none-any.whl (12 kB)\nRequirement already satisfied: numpy in /databricks/python3/lib/python3.10/site-packages (from adjustText) (1.23.5)\nRequirement already satisfied: scipy in /databricks/python3/lib/python3.10/site-packages (from adjustText) (1.10.0)\nRequirement already satisfied: matplotlib in /databricks/python3/lib/python3.10/site-packages (from adjustText) (3.7.0)\nRequirement already satisfied: python-dateutil>=2.7 in /databricks/python3/lib/python3.10/site-packages (from matplotlib->adjustText) (2.8.2)\nRequirement already satisfied: cycler>=0.10 in /databricks/python3/lib/python3.10/site-packages (from matplotlib->adjustText) (0.11.0)\nRequirement already satisfied: kiwisolver>=1.0.1 in /databricks/python3/lib/python3.10/site-packages (from matplotlib->adjustText) (1.4.4)\nRequirement already satisfied: pillow>=6.2.0 in /databricks/python3/lib/python3.10/site-packages (from matplotlib->adjustText) (9.4.0)\nRequirement already satisfied: contourpy>=1.0.1 in /databricks/python3/lib/python3.10/site-packages (from matplotlib->adjustText) (1.0.5)\nRequirement already satisfied: fonttools>=4.22.0 in /databricks/python3/lib/python3.10/site-packages (from matplotlib->adjustText) (4.25.0)\nRequirement already satisfied: packaging>=20.0 in /databricks/python3/lib/python3.10/site-packages (from matplotlib->adjustText) (23.2)\nRequirement already satisfied: pyparsing>=2.3.1 in /databricks/python3/lib/python3.10/site-packages (from matplotlib->adjustText) (3.0.9)\nRequirement already satisfied: six>=1.5 in /usr/lib/python3/dist-packages (from python-dateutil>=2.7->matplotlib->adjustText) (1.16.0)\nInstalling collected packages: adjustText\nSuccessfully installed adjustText-1.2.0\n\u001B[43mNote: you may need to restart the kernel using dbutils.library.restartPython() to use updated packages.\u001B[0m\n"
     ]
    }
   ],
   "source": [
    "!pip install adjustText"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "0bcbb96e-f7f4-4800-8b76-382b10ac7119",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Top 15 models scatter plot saved in: /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/plots\n"
     ]
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "import numpy as np\n",
    "import os\n",
    "from matplotlib.patches import Rectangle\n",
    "\n",
    "def set_neurips_style():\n",
    "    sns.set_style(\"whitegrid\")\n",
    "    plt.rcParams['font.family'] = 'serif'\n",
    "    plt.rcParams['font.serif'] = ['Times New Roman'] + plt.rcParams['font.serif']\n",
    "    plt.rcParams['font.size'] = 9\n",
    "    plt.rcParams['axes.labelsize'] = 12\n",
    "    plt.rcParams['axes.titlesize'] = 14\n",
    "    plt.rcParams['xtick.labelsize'] = 10\n",
    "    plt.rcParams['ytick.labelsize'] = 10\n",
    "    plt.rcParams['legend.fontsize'] = 10\n",
    "    plt.rcParams['figure.titlesize'] = 16\n",
    "\n",
    "def clean_model_name(name):\n",
    "    return name.replace('gpt-', '').replace('llama-', '').replace('-chat', '').replace('-instruct', '')\n",
    "\n",
    "def plot_top_15_models_scatter(results, plot_dir):\n",
    "    set_neurips_style()\n",
    "    \n",
    "    # Sort models by F1 score, select top 15, and remove GPT-4o\n",
    "    sorted_data = sorted(results.items(), key=lambda x: x[1]['f1_score'], reverse=True)\n",
    "    sorted_data = [item for item in sorted_data if 'gpt-4o' not in item[0].lower()][:15]\n",
    "    models, data = zip(*sorted_data)\n",
    "    \n",
    "    f1_scores = [d['f1_score'] for d in data]\n",
    "    instruction_scores = [d['instruction_following'] for d in data]\n",
    "    \n",
    "    fig, ax = plt.subplots(figsize=(12, 12))  # Square figure\n",
    "    \n",
    "    # Create scatter plot\n",
    "    scatter = ax.scatter(f1_scores, instruction_scores, s=100, alpha=0.7)\n",
    "    \n",
    "    # Add labels for each point\n",
    "    for i, model in enumerate(models):\n",
    "        cleaned_name = clean_model_name(model)\n",
    "        ax.annotate(cleaned_name, (f1_scores[i], instruction_scores[i]), \n",
    "                    xytext=(-5, 0), textcoords='offset points', fontsize=8, \n",
    "                    fontweight='bold' if 'med' in model.lower() else 'normal',\n",
    "                    ha='right', va='center')\n",
    "    \n",
    "    # Set the top performers quadrant\n",
    "    quadrant_start = 0.75\n",
    "    ax.add_patch(Rectangle((quadrant_start, quadrant_start), 1-quadrant_start, 1-quadrant_start, \n",
    "                           fill=True, facecolor='lightgreen', edgecolor='green', \n",
    "                           alpha=0.2, linestyle='--', linewidth=2))\n",
    "    ax.text(0.76, 0.99, 'Best Performers', fontsize=12, \n",
    "            color='darkgreen', fontweight='bold', va='top')\n",
    "    \n",
    "    # Set labels and title\n",
    "    ax.set_xlabel('F1 Score', fontsize=14)\n",
    "    ax.set_ylabel('Instruction Following Score', fontsize=14)\n",
    "    ax.set_title('Top 15 Models: F1 Score vs Instruction Following', fontsize=18, fontweight='bold')\n",
    "    \n",
    "    # Set consistent axis limits and ticks\n",
    "    min_value = min(min(f1_scores), min(instruction_scores))\n",
    "    max_value = max(max(f1_scores), max(instruction_scores))\n",
    "    axis_min = max(0, round(min_value - 0.05, 1))  # Round to 1 decimal place, but not less than 0\n",
    "    axis_max = min(1, round(max_value + 0.05, 1))  # Round to 1 decimal place, but not more than 1\n",
    "    \n",
    "    ax.set_xlim(axis_min, axis_max)\n",
    "    ax.set_ylim(axis_min, axis_max)\n",
    "    \n",
    "    # Set consistent ticks\n",
    "    ticks = np.arange(axis_min, axis_max + 0.1, 0.1)  # +0.1 to include the max value\n",
    "    ax.set_xticks(ticks)\n",
    "    ax.set_yticks(ticks)\n",
    "    \n",
    "    # Add gridlines\n",
    "    ax.grid(True, linestyle='--', alpha=0.7)\n",
    "    \n",
    "    # Add diagonal line\n",
    "    ax.plot([0, 1], [0, 1], transform=ax.transAxes, ls='--', c='gray')\n",
    "    \n",
    "    # Color points based on whether they're medical models\n",
    "    colors = ['darkblue' if 'med' in model.lower() else 'lightblue' for model in models]\n",
    "    for i, color in enumerate(colors):\n",
    "        scatter.set_facecolors(colors)\n",
    "    \n",
    "    # Create legend\n",
    "    legend_elements = [plt.Line2D([0], [0], marker='o', color='w', label='Non-medical Models',\n",
    "                                  markerfacecolor='lightblue', markersize=10),\n",
    "                       plt.Line2D([0], [0], marker='o', color='w', label='Medical Models',\n",
    "                                  markerfacecolor='darkblue', markersize=10)]\n",
    "    ax.legend(handles=legend_elements, loc='lower right', fontsize=10)\n",
    "    \n",
    "    plt.tight_layout()\n",
    "    plt.savefig(os.path.join(plot_dir, 'top_15_models_scatter.pdf'), dpi=300, bbox_inches='tight')\n",
    "    plt.savefig(os.path.join(plot_dir, 'top_15_models_scatter.png'), dpi=300, bbox_inches='tight')\n",
    "    plt.close(fig)\n",
    "\n",
    "# Main execution\n",
    "if __name__ == \"__main__\":\n",
    "    BASE_DIR = \"/Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/\"\n",
    "    RESULTS_DIR = os.path.join(BASE_DIR, \"model_results\")\n",
    "    PLOT_DIR = ensure_plot_dir(BASE_DIR)\n",
    "    \n",
    "    # Load results with F1 scores and instruction following scores\n",
    "    results = load_results_with_f1(RESULTS_DIR)\n",
    "    \n",
    "    # Plot top 15 models scatter plot\n",
    "    plot_top_15_models_scatter(results, PLOT_DIR)\n",
    "    \n",
    "    print(f\"Top 15 models scatter plot saved in: {PLOT_DIR}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "inputWidgets": {},
     "nuid": "6ad73d56-098c-4b4a-88b4-fc218ba66a12",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Top 15 models scatter plot saved in: /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/plots\n"
     ]
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "import numpy as np\n",
    "import os\n",
    "from matplotlib.patches import Rectangle\n",
    "from adjustText import adjust_text\n",
    "\n",
    "def set_neurips_style():\n",
    "    sns.set_style(\"whitegrid\")\n",
    "    plt.rcParams['font.family'] = 'serif'\n",
    "    plt.rcParams['font.serif'] = ['Times New Roman'] + plt.rcParams['font.serif']\n",
    "    plt.rcParams['font.size'] = 10\n",
    "    plt.rcParams['axes.labelsize'] = 14\n",
    "    plt.rcParams['axes.titlesize'] = 16\n",
    "    plt.rcParams['xtick.labelsize'] = 12\n",
    "    plt.rcParams['ytick.labelsize'] = 12\n",
    "    plt.rcParams['legend.fontsize'] = 12\n",
    "    plt.rcParams['figure.titlesize'] = 18\n",
    "\n",
    "def clean_model_name(name):\n",
    "    return name.replace('gpt-', '').replace('llama-', '').replace('-chat', '').replace('-instruct', '')\n",
    "\n",
    "def calculate_composite_score(f1_score, instruction_following):\n",
    "    return (f1_score + instruction_following) / 2\n",
    "\n",
    "def plot_top_15_models_scatter(results, plot_dir):\n",
    "    set_neurips_style()\n",
    "    \n",
    "    # Calculate composite scores and sort\n",
    "    sorted_data = [(model, data['f1_score'], data['instruction_following'],\n",
    "                    calculate_composite_score(data['f1_score'], data['instruction_following']))\n",
    "                   for model, data in results.items() if 'gpt-4o' not in model.lower()]\n",
    "    sorted_data.sort(key=lambda x: x[3], reverse=True)\n",
    "    top_15 = sorted_data[:15]\n",
    "    \n",
    "    models, f1_scores, instruction_scores, composite_scores = zip(*top_15)\n",
    "    \n",
    "    fig, ax = plt.subplots(figsize=(14, 14))  # Larger square figure\n",
    "    \n",
    "    # Create scatter plot\n",
    "    scatter = ax.scatter(f1_scores, instruction_scores, s=100, alpha=0.7)\n",
    "    \n",
    "    # Prepare texts for adjustment\n",
    "    texts = []\n",
    "    for i, model in enumerate(models):\n",
    "        cleaned_name = clean_model_name(model)\n",
    "        texts.append(ax.text(f1_scores[i], instruction_scores[i], \n",
    "                             f\"{cleaned_name}\\n(CS: {composite_scores[i]:.2f})\", \n",
    "                             fontsize=10, fontweight='bold' if 'med' in model.lower() else 'normal'))\n",
    "    \n",
    "    # Adjust text positions to prevent overlap\n",
    "    adjust_text(texts, arrowprops=dict(arrowstyle='-', color='gray', lw=0.5))\n",
    "    \n",
    "    # Set the top performers quadrant\n",
    "    quadrant_start = 0.75\n",
    "    ax.add_patch(Rectangle((quadrant_start, quadrant_start), 1-quadrant_start, 1-quadrant_start, \n",
    "                           fill=True, facecolor='lightgreen', edgecolor='green', \n",
    "                           alpha=0.2, linestyle='--', linewidth=2))\n",
    "    ax.text(0.76, 0.99, 'Best Performers', fontsize=14, \n",
    "            color='darkgreen', fontweight='bold', va='top')\n",
    "    \n",
    "    # Set labels and title\n",
    "    ax.set_xlabel('F1 Score', fontsize=16)\n",
    "    ax.set_ylabel('Instruction Following Score', fontsize=16)\n",
    "    ax.set_title('Top 15 Models by Composite Score: F1 Score vs Instruction Following', fontsize=20, fontweight='bold')\n",
    "    \n",
    "    # Set axis limits\n",
    "    ax.set_xlim(0.5, 1.0)\n",
    "    ax.set_ylim(0.5, 1.0)\n",
    "    \n",
    "    # Set ticks\n",
    "    ticks = np.arange(0.5, 1.01, 0.1)\n",
    "    ax.set_xticks(ticks)\n",
    "    ax.set_yticks(ticks)\n",
    "    \n",
    "    # Add gridlines\n",
    "    ax.grid(True, linestyle='--', alpha=0.7)\n",
    "    \n",
    "    # Add diagonal line\n",
    "    ax.plot([0.5, 1], [0.5, 1], ls='--', c='gray')\n",
    "    \n",
    "    # Color points based on whether they're medical models\n",
    "    colors = ['darkblue' if 'med' in model.lower() else 'lightblue' for model in models]\n",
    "    for i, color in enumerate(colors):\n",
    "        scatter.set_facecolors(colors)\n",
    "    \n",
    "    # Create legend\n",
    "    legend_elements = [plt.Line2D([0], [0], marker='o', color='w', label='Non-medical Models',\n",
    "                                  markerfacecolor='lightblue', markersize=10),\n",
    "                       plt.Line2D([0], [0], marker='o', color='w', label='Medical Models',\n",
    "                                  markerfacecolor='darkblue', markersize=10)]\n",
    "    ax.legend(handles=legend_elements, loc='lower right', fontsize=12)\n",
    "    \n",
    "    plt.tight_layout()\n",
    "    plt.savefig(os.path.join(plot_dir, 'top_15_models_composite_scatter_improved.pdf'), dpi=300, bbox_inches='tight')\n",
    "    plt.savefig(os.path.join(plot_dir, 'top_15_models_composite_scatter_improved.png'), dpi=300, bbox_inches='tight')\n",
    "    plt.close(fig)\n",
    "\n",
    "\n",
    "# Main execution\n",
    "if __name__ == \"__main__\":\n",
    "    BASE_DIR = \"/Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/\"\n",
    "    RESULTS_DIR = os.path.join(BASE_DIR, \"model_results\")\n",
    "    PLOT_DIR = ensure_plot_dir(BASE_DIR)\n",
    "    \n",
    "    # Load results with F1 scores and instruction following scores\n",
    "    results = load_results_with_f1(RESULTS_DIR)\n",
    "    \n",
    "    # Plot top 15 models scatter plot\n",
    "    plot_top_15_models_scatter(results, PLOT_DIR)\n",
    "    \n",
    "    print(f\"Top 15 models scatter plot saved in: {PLOT_DIR}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 0,
   "metadata": {
    "application/vnd.databricks.v1+cell": {
     "cellMetadata": {
      "byteLimit": 2048000,
      "rowLimit": 10000
     },
     "collapsed": true,
     "inputWidgets": {},
     "nuid": "a3295a6e-24c8-4168-8b6a-a6a28853ea25",
     "showTitle": false,
     "title": ""
    }
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\u001B[43mNote: you may need to restart the kernel using dbutils.library.restartPython() to use updated packages.\u001B[0m\nRequirement already satisfied: PyPDF2 in /local_disk0/.ephemeral_nfs/envs/pythonEnv-7183bb06-8be9-4a05-a076-028536914efd/lib/python3.10/site-packages (3.0.1)\n\u001B[43mNote: you may need to restart the kernel using dbutils.library.restartPython() to use updated packages.\u001B[0m\nAll plots have been merged into: /Workspace/Users/vurgunu@pennmedicine.upenn.edu/IHCA/plots/IHCA_plots_20240823.pdf\n"
     ]
    }
   ],
   "source": [
    "!pip install PyPDF2 \n",
    "import PyPDF2\n",
    "from datetime import date\n",
    "\n",
    "def concatenate_pdfs(plot_dir):\n",
    "    # Get today's date\n",
    "    today = date.today().strftime(\"%Y%m%d\")\n",
    "    \n",
    "    # Create a PDF merger object\n",
    "    merger = PyPDF2.PdfMerger()\n",
    "    \n",
    "    # List all PDF files in the plot directory\n",
    "    pdf_files = [f for f in os.listdir(plot_dir) if f.endswith('.pdf')]\n",
    "    \n",
    "    # Add each PDF to the merger\n",
    "    for pdf in pdf_files:\n",
    "        merger.append(os.path.join(plot_dir, pdf))\n",
    "    \n",
    "    # Create the output filename\n",
    "    output_filename = f\"IHCA_plots_{today}.pdf\"\n",
    "    output_path = os.path.join(plot_dir, output_filename)\n",
    "    \n",
    "    # Write the merged PDF to the output file\n",
    "    with open(output_path, 'wb') as output_file:\n",
    "        merger.write(output_file)\n",
    "    \n",
    "    print(f\"All plots have been merged into: {output_path}\")\n",
    "\n",
    "# After generating all plots, call the concatenate_pdfs function\n",
    "concatenate_pdfs(PLOT_DIR)"
   ]
  }
 ],
 "metadata": {
  "application/vnd.databricks.v1+notebook": {
   "dashboards": [],
   "environmentMetadata": null,
   "language": "python",
   "notebookMetadata": {
    "pythonIndentUnit": 4
   },
   "notebookName": "xxxx_for the priority dataset (template for other open models)",
   "widgets": {}
  }
 },
 "nbformat": 4,
 "nbformat_minor": 0
}
