{
  "cells": [
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "eFUaP3XP3yE9"
      },
      "outputs": [],
      "source": [
        "# =========================================\n",
        "# MIMIC-IV: AKI causal inference with Notes (LLM hook, single-file)\n",
        "# =========================================\n",
        "from __future__ import annotations\n",
        "\n",
        "# Imports\n",
        "import os, re, json, time, math, datetime as dt\n",
        "import numpy as np\n",
        "import pandas as pd\n",
        "from google.colab import drive\n",
        "import statsmodels.api as sm\n",
        "import matplotlib.pyplot as plt\n",
        "from pathlib import Path\n",
        "from sklearn.linear_model import LogisticRegression\n",
        "import gc"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "8dmcf_6O9aZ8",
        "outputId": "459e930d-c852-4803-d535-961b919a4eea"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Collecting lifelines\n",
            "  Downloading lifelines-0.30.0-py3-none-any.whl.metadata (3.2 kB)\n",
            "Requirement already satisfied: numpy>=1.14.0 in /usr/local/lib/python3.12/dist-packages (from lifelines) (2.0.2)\n",
            "Requirement already satisfied: scipy>=1.7.0 in /usr/local/lib/python3.12/dist-packages (from lifelines) (1.16.1)\n",
            "Requirement already satisfied: pandas>=2.1 in /usr/local/lib/python3.12/dist-packages (from lifelines) (2.2.2)\n",
            "Requirement already satisfied: matplotlib>=3.0 in /usr/local/lib/python3.12/dist-packages (from lifelines) (3.10.0)\n",
            "Requirement already satisfied: autograd>=1.5 in /usr/local/lib/python3.12/dist-packages (from lifelines) (1.8.0)\n",
            "Collecting autograd-gamma>=0.3 (from lifelines)\n",
            "  Downloading autograd-gamma-0.5.0.tar.gz (4.0 kB)\n",
            "  Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
            "Collecting formulaic>=0.2.2 (from lifelines)\n",
            "  Downloading formulaic-1.2.0-py3-none-any.whl.metadata (7.0 kB)\n",
            "Collecting interface-meta>=1.2.0 (from formulaic>=0.2.2->lifelines)\n",
            "  Downloading interface_meta-1.3.0-py3-none-any.whl.metadata (6.7 kB)\n",
            "Requirement already satisfied: narwhals>=1.17 in /usr/local/lib/python3.12/dist-packages (from formulaic>=0.2.2->lifelines) (2.1.2)\n",
            "Requirement already satisfied: typing-extensions>=4.2.0 in /usr/local/lib/python3.12/dist-packages (from formulaic>=0.2.2->lifelines) (4.14.1)\n",
            "Requirement already satisfied: wrapt>=1.0 in /usr/local/lib/python3.12/dist-packages (from formulaic>=0.2.2->lifelines) (1.17.3)\n",
            "Requirement already satisfied: contourpy>=1.0.1 in /usr/local/lib/python3.12/dist-packages (from matplotlib>=3.0->lifelines) (1.3.3)\n",
            "Requirement already satisfied: cycler>=0.10 in /usr/local/lib/python3.12/dist-packages (from matplotlib>=3.0->lifelines) (0.12.1)\n",
            "Requirement already satisfied: fonttools>=4.22.0 in /usr/local/lib/python3.12/dist-packages (from matplotlib>=3.0->lifelines) (4.59.1)\n",
            "Requirement already satisfied: kiwisolver>=1.3.1 in /usr/local/lib/python3.12/dist-packages (from matplotlib>=3.0->lifelines) (1.4.9)\n",
            "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.12/dist-packages (from matplotlib>=3.0->lifelines) (25.0)\n",
            "Requirement already satisfied: pillow>=8 in /usr/local/lib/python3.12/dist-packages (from matplotlib>=3.0->lifelines) (11.3.0)\n",
            "Requirement already satisfied: pyparsing>=2.3.1 in /usr/local/lib/python3.12/dist-packages (from matplotlib>=3.0->lifelines) (3.2.3)\n",
            "Requirement already satisfied: python-dateutil>=2.7 in /usr/local/lib/python3.12/dist-packages (from matplotlib>=3.0->lifelines) (2.9.0.post0)\n",
            "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.12/dist-packages (from pandas>=2.1->lifelines) (2025.2)\n",
            "Requirement already satisfied: tzdata>=2022.7 in /usr/local/lib/python3.12/dist-packages (from pandas>=2.1->lifelines) (2025.2)\n",
            "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.12/dist-packages (from python-dateutil>=2.7->matplotlib>=3.0->lifelines) (1.17.0)\n",
            "Downloading lifelines-0.30.0-py3-none-any.whl (349 kB)\n",
            "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m349.3/349.3 kB\u001b[0m \u001b[31m6.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25hDownloading formulaic-1.2.0-py3-none-any.whl (117 kB)\n",
            "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m117.2/117.2 kB\u001b[0m \u001b[31m15.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25hDownloading interface_meta-1.3.0-py3-none-any.whl (14 kB)\n",
            "Building wheels for collected packages: autograd-gamma\n",
            "  Building wheel for autograd-gamma (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
            "  Created wheel for autograd-gamma: filename=autograd_gamma-0.5.0-py3-none-any.whl size=4030 sha256=bcd1df76fb8b7a2d5915d1390794276134b4d542ac536ce3d8efd3121df4e9b5\n",
            "  Stored in directory: /root/.cache/pip/wheels/50/37/21/0a719b9d89c635e89ff24bd93b862882ad675279552013b2fb\n",
            "Successfully built autograd-gamma\n",
            "Installing collected packages: interface-meta, autograd-gamma, formulaic, lifelines\n",
            "Successfully installed autograd-gamma-0.5.0 formulaic-1.2.0 interface-meta-1.3.0 lifelines-0.30.0\n"
          ]
        }
      ],
      "source": [
        "#!pip install lifelines"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "m1apKexu354k"
      },
      "outputs": [],
      "source": [
        "try:\n",
        "    from lifelines import CoxPHFitter\n",
        "except Exception:\n",
        "    CoxPHFitter = None"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "clIh6htK371d"
      },
      "outputs": [],
      "source": [
        "!pip install python-dotenv -q\n",
        "from dotenv import load_dotenv\n",
        "from __future__ import annotations"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "b5QOXD8R3_iq",
        "outputId": "53d620bd-cdee-4cc0-d908-f92bcc14f39d"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Mounted at /content/drive\n"
          ]
        },
        {
          "data": {
            "text/plain": [
              "True"
            ]
          },
          "execution_count": 5,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "drive.mount('/content/drive')\n",
        "drive_path = '/content/drive/MyDrive/'\n",
        "load_dotenv(drive_path + 'Colab Notebooks/env_config/.env')"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "3Js0sNM844bA"
      },
      "outputs": [],
      "source": [
        "# ---------- Config ----------\n",
        "pd.set_option(\"display.max_rows\", 8)\n",
        "MIMIC_DIR = Path(\"/content/drive/MyDrive/data/mimiciv/3.1/\")  # <- 경로 맞게 수정\n",
        "HOSP = MIMIC_DIR / \"hosp\"\n",
        "NOTE = MIMIC_DIR / \"note\"\n",
        "OUTD = Path(\"/content/drive/MyDrive/results_ci\"); OUTD.mkdir(parents=True, exist_ok=True)\n",
        "\n",
        "# 큰 csv.gz는 청크로\n",
        "READ_KW = dict(dtype_backend=\"pyarrow\", low_memory=False)\n",
        "\n",
        "# Causal / modeling\n",
        "RANDOM_STATE   = 7\n",
        "PS_CLIP        = (1e-3, 1-1e-3)\n",
        "W_TRIM         = (0.01, 0.99)\n",
        "VPT_WINDOW_HOURS = 6\n",
        "COX_PENALIZER  = 0.1\n",
        "\n",
        "# Regex / patterns\n",
        "RX_SCR_LABEL = \"creatinine\"                  # simple substring (no regex)\n",
        "RX_SCR_FLUID = r\"\\b(?:serum|blood)\\b\"        # regex\n",
        "RX_MGDL      = r\"\\bmg/dl\\b\"\n",
        "RX_MGL       = r\"\\bmg/l\\b\"\n",
        "RX_VANCO_SUB = \"vancomycin\"\n",
        "RX_PTZ       = r\"(?:piperacillin|tazobactam|zosyn)\"\n",
        "RX_EMERG_SUB = \"EMER\"\n",
        "\n",
        "# LLM confounders (배치 출력이 제공하는 키)\n",
        "CONFOUNDERS = [\"f_ckd_pre\", \"f_dm_pre\", \"f_hf_pre\", \"f_liver_pre\", \"f_nephrotox_pre\"]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "6hFLw0iy4854"
      },
      "outputs": [],
      "source": [
        "# =========================\n",
        "# Utils\n",
        "# =========================\n",
        "def _to_datetime_safe(s: pd.Series, fmt: str | None = \"%Y-%m-%d %H:%M:%S\") -> pd.Series:\n",
        "    x = pd.to_datetime(s, errors=\"coerce\", format=fmt)\n",
        "    if x.isna().any():\n",
        "        y = pd.to_datetime(s[x.isna()], errors=\"coerce\")\n",
        "        x.loc[x.isna()] = y\n",
        "    return x\n",
        "\n",
        "def _smd(x, t, w=None):\n",
        "    x = np.asarray(x, float); t = np.asarray(t, int)\n",
        "    if w is None: w = np.ones_like(t, float)\n",
        "    if (t==1).sum()==0 or (t==0).sum()==0: return np.nan\n",
        "    m1 = np.average(x[t==1], weights=w[t==1]); m0 = np.average(x[t==0], weights=w[t==0])\n",
        "    v1 = np.average((x[t==1]-m1)**2, weights=w[t==1]); v0 = np.average((x[t==0]-m0)**2, weights=w[t==0])\n",
        "    return (m1-m0)/np.sqrt((v1+v0)/2 + 1e-9)\n",
        "\n",
        "def evalue_from_hr(hr, lcl, ucl):\n",
        "    def _ev(x: float) -> float:\n",
        "        return x + math.sqrt(max(x,0)*(max(x,0)-1.0)) if x>1 else 1.0\n",
        "    return (_ev(float(hr)), _ev(float(lcl)) if float(lcl)>1 else 1.0)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "UOS8PqjC4-4h"
      },
      "outputs": [],
      "source": [
        "# =========================\n",
        "# 1) Treatment cohort (V vs VPT)\n",
        "# =========================\n",
        "def build_cohort(hosp: Path) -> pd.DataFrame:\n",
        "    use_cols = [\"subject_id\",\"hadm_id\",\"starttime\",\"stoptime\",\"drug\"]\n",
        "    it = pd.read_csv(hosp/\"prescriptions.csv.gz\",\n",
        "                     usecols=lambda c: c in use_cols,\n",
        "                     chunksize=500_000, low_memory=False)\n",
        "    v_chunks, p_chunks = [], []\n",
        "\n",
        "    for ch in it:\n",
        "        ch[\"starttime\"] = _to_datetime_safe(ch[\"starttime\"])\n",
        "        ch[\"stoptime\"]  = _to_datetime_safe(ch[\"stoptime\"])\n",
        "        dlow = ch[\"drug\"].astype(\"string\").str.lower()\n",
        "\n",
        "        v = ch[dlow.str.contains(RX_VANCO_SUB, na=False, regex=False)]\n",
        "        p = ch[dlow.str.contains(RX_PTZ,       na=False, regex=True)]\n",
        "\n",
        "        v = v.rename(columns={\"starttime\":\"v_start\",\"stoptime\":\"v_stop\"})\n",
        "        p = p.rename(columns={\"starttime\":\"p_start\",\"stoptime\":\"p_stop\"})\n",
        "        v_chunks.append(v[[\"subject_id\",\"hadm_id\",\"v_start\",\"v_stop\"]])\n",
        "        p_chunks.append(p[[\"subject_id\",\"hadm_id\",\"p_start\",\"p_stop\"]])\n",
        "\n",
        "    vanco = pd.concat(v_chunks, ignore_index=True) if v_chunks else \\\n",
        "            pd.DataFrame(columns=[\"subject_id\",\"hadm_id\",\"v_start\",\"v_stop\"])\n",
        "    ptz   = pd.concat(p_chunks, ignore_index=True) if p_chunks else \\\n",
        "            pd.DataFrame(columns=[\"subject_id\",\"hadm_id\",\"p_start\",\"p_stop\"])\n",
        "\n",
        "    v1 = (vanco.sort_values(\"v_start\")\n",
        "                .groupby([\"subject_id\",\"hadm_id\"], as_index=False)\n",
        "                .agg(index_time=(\"v_start\",\"first\")))\n",
        "    p1 = (ptz.sort_values(\"p_start\")\n",
        "              .groupby([\"subject_id\",\"hadm_id\"], as_index=False)\n",
        "              .agg(ptz_time=(\"p_start\",\"first\")))\n",
        "\n",
        "    v1[\"index_time\"] = _to_datetime_safe(v1[\"index_time\"])\n",
        "    p1[\"ptz_time\"]   = _to_datetime_safe(p1[\"ptz_time\"])\n",
        "\n",
        "    cohort = v1.merge(p1, how=\"left\", on=[\"subject_id\",\"hadm_id\"])\n",
        "    cohort = cohort.dropna(subset=[\"index_time\"]).reset_index(drop=True)\n",
        "\n",
        "    # STRICT: ptz_time within +6h\n",
        "    cohort[\"vpt_flag\"] = (\n",
        "        cohort[\"ptz_time\"].notna() &\n",
        "        (cohort[\"ptz_time\"] >= cohort[\"index_time\"]) &\n",
        "        (cohort[\"ptz_time\"] <= cohort[\"index_time\"] + pd.Timedelta(hours=VPT_WINDOW_HOURS))\n",
        "    ).astype(int)\n",
        "\n",
        "    for k in (\"subject_id\",\"hadm_id\"):\n",
        "        cohort[k] = cohort[k].astype(\"Int64\")\n",
        "\n",
        "    print(f\"[cohort] N={len(cohort)}  VPT={int(cohort['vpt_flag'].sum())}\")\n",
        "    return cohort"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "7Sh4x86O5CEZ"
      },
      "outputs": [],
      "source": [
        "# =========================\n",
        "# 2) Labs → SCr & AKI labels\n",
        "# =========================\n",
        "def load_scr_itemids(hosp: Path) -> list[int]:\n",
        "    d_lab = pd.read_csv(hosp/\"d_labitems.csv.gz\", **READ_KW)\n",
        "    mask = (\n",
        "        d_lab[\"label\"].astype(\"string\").str.contains(RX_SCR_LABEL, na=False, regex=False, case=False) &\n",
        "        d_lab[\"fluid\"].astype(\"string\").str.contains(RX_SCR_FLUID, na=False, regex=True, case=False)\n",
        "    )\n",
        "    ids = d_lab.loc[mask, \"itemid\"].dropna().astype(\"Int64\").astype(int).unique().tolist()\n",
        "    if len(ids) == 0:\n",
        "        mask2 = d_lab[\"label\"].astype(\"string\").str.contains(RX_SCR_LABEL, na=False, regex=False, case=False)\n",
        "        ids = d_lab.loc[mask2, \"itemid\"].dropna().astype(\"Int64\").astype(int).unique().tolist()\n",
        "\n",
        "    print(f\"[scr ids] K={len(ids)}  sample: {ids[:3]}\")\n",
        "    return ids\n",
        "\n",
        "def load_scr_timeseries(hosp: Path, cohort: pd.DataFrame, scr_ids: list[int]) -> pd.DataFrame:\n",
        "    if len(scr_ids)==0:\n",
        "        raise RuntimeError(\"No SCr itemids found. Check d_labitems.csv.gz filters.\")\n",
        "\n",
        "    hadm_set = set(cohort[\"hadm_id\"].dropna().astype(int).unique().tolist())\n",
        "    keep = [\"subject_id\",\"hadm_id\",\"itemid\",\"charttime\",\"valuenum\",\"valueuom\"]\n",
        "\n",
        "    it = pd.read_csv(hosp/\"labevents.csv.gz\",\n",
        "                     usecols=lambda c: c in keep,\n",
        "                     chunksize=1_000_000, low_memory=False)\n",
        "    chunks=[]\n",
        "    for ch in it:\n",
        "        ch = ch[ch[\"itemid\"].isin(scr_ids)]\n",
        "        ch = ch[ch[\"hadm_id\"].isin(hadm_set)]\n",
        "        if len(ch)==0:\n",
        "            continue\n",
        "        ch[\"charttime\"] = _to_datetime_safe(ch[\"charttime\"])\n",
        "\n",
        "        u = ch[\"valueuom\"].astype(\"string\").str.lower()\n",
        "        ch[\"scr_mgdl\"] = ch[\"valuenum\"]\n",
        "\n",
        "        m_mgl  = u.str.contains(RX_MGL,  na=False, regex=True)\n",
        "        m_mgdl = u.str.contains(RX_MGDL, na=False, regex=True)\n",
        "\n",
        "        ch.loc[m_mgl, \"scr_mgdl\"] = ch.loc[m_mgl, \"valuenum\"] / 10.0\n",
        "        ch = ch[m_mgdl | m_mgl]\n",
        "        if len(ch):\n",
        "            chunks.append(ch[[\"subject_id\",\"hadm_id\",\"itemid\",\"charttime\",\"scr_mgdl\"]])\n",
        "\n",
        "    df = pd.concat(chunks, ignore_index=True) if chunks else \\\n",
        "         pd.DataFrame(columns=[\"subject_id\",\"hadm_id\",\"itemid\",\"charttime\",\"scr_mgdl\"])\n",
        "\n",
        "    df = df.merge(cohort[[\"subject_id\",\"hadm_id\",\"index_time\",\"vpt_flag\"]],\n",
        "                  on=[\"subject_id\",\"hadm_id\"], how=\"inner\")\n",
        "\n",
        "    if len(df)==0:\n",
        "        print(\"[scr ts] rows=0 (no overlapping SCr rows for cohort)\")\n",
        "        return df\n",
        "\n",
        "    df[\"index_time\"] = _to_datetime_safe(df[\"index_time\"])\n",
        "    df = df.dropna(subset=[\"charttime\",\"index_time\"]).reset_index(drop=True)\n",
        "    df[\"dt\"] = (df[\"charttime\"] - df[\"index_time\"]).dt.total_seconds()/3600.0\n",
        "    df = df.sort_values([\"subject_id\",\"hadm_id\",\"charttime\"]).reset_index(drop=True)\n",
        "    for k in (\"subject_id\",\"hadm_id\"):\n",
        "        df[k] = df[k].astype(\"Int64\")\n",
        "    print(f\"[scr ts] rows={len(df)}\")\n",
        "    return df\n",
        "\n",
        "def label_aki(df: pd.DataFrame, cohort: pd.DataFrame) -> pd.DataFrame:\n",
        "    if len(df)==0:\n",
        "        out = cohort.copy()\n",
        "        out[\"baseline\"] = np.nan\n",
        "        out[\"aki48\"] = 0; out[\"aki7x\"] = 0; out[\"aki\"] = 0\n",
        "        print(f\"[aki] rate=0.000  N={len(out)} (no SCr rows)\")\n",
        "        return out\n",
        "\n",
        "    base = (df[(df[\"dt\"]>=-24) & (df[\"dt\"]<=0)]\n",
        "              .groupby([\"subject_id\",\"hadm_id\"], as_index=False)\n",
        "              .agg(baseline=(\"scr_mgdl\",\"median\")))\n",
        "    out = cohort.merge(base, on=[\"subject_id\",\"hadm_id\"], how=\"left\")\n",
        "\n",
        "    if out[\"baseline\"].isna().any():\n",
        "        first24 = (df[(df[\"dt\"]>=0) & (df[\"dt\"]<=24)]\n",
        "                     .sort_values(\"charttime\")\n",
        "                     .groupby([\"subject_id\",\"hadm_id\"], as_index=False)\n",
        "                     .agg(first24=(\"scr_mgdl\",\"first\")))\n",
        "        out = out.merge(first24, on=[\"subject_id\",\"hadm_id\"], how=\"left\")\n",
        "        out[\"baseline\"] = out[\"baseline\"].fillna(out[\"first24\"])\n",
        "\n",
        "    p48 = (df[(df[\"dt\"]>0) & (df[\"dt\"]<=48)]\n",
        "             .groupby([\"subject_id\",\"hadm_id\"], as_index=False)\n",
        "             .agg(max48=(\"scr_mgdl\",\"max\")))\n",
        "    p7d = (df[(df[\"dt\"]>0) & (df[\"dt\"]<=24*7)]\n",
        "             .groupby([\"subject_id\",\"hadm_id\"], as_index=False)\n",
        "             .agg(max7=(\"scr_mgdl\",\"max\")))\n",
        "\n",
        "    out = out.merge(p48, on=[\"subject_id\",\"hadm_id\"], how=\"left\") \\\n",
        "             .merge(p7d, on=[\"subject_id\",\"hadm_id\"], how=\"left\")\n",
        "\n",
        "    out[\"aki48\"] = (out[\"max48\"] >= (out[\"baseline\"] + 0.3)).astype(int)\n",
        "    out[\"aki7x\"] = (out[\"max7\"]  >= (1.5 * out[\"baseline\"])).astype(int)\n",
        "    out[\"aki\"]   = ((out[\"aki48\"]==1) | (out[\"aki7x\"]==1)).astype(int)\n",
        "\n",
        "    print(f\"[aki] rate={out['aki'].mean():.3f}  N={len(out)}\")\n",
        "    return out"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "B0OElzul4Dxb"
      },
      "outputs": [],
      "source": [
        "# =========================\n",
        "# 3) Time-to-event window (≤7d)\n",
        "# =========================\n",
        "def build_event_times(df_scr: pd.DataFrame, out: pd.DataFrame, hosp: Path) -> pd.DataFrame:\n",
        "    adm = pd.read_csv(hosp/\"admissions.csv.gz\",\n",
        "                      usecols=[\"subject_id\",\"hadm_id\",\"admittime\",\"dischtime\"],\n",
        "                      parse_dates=[\"admittime\",\"dischtime\"], **READ_KW)\n",
        "    adm[\"admittime\"] = _to_datetime_safe(adm[\"admittime\"])\n",
        "    adm[\"dischtime\"] = _to_datetime_safe(adm[\"dischtime\"])\n",
        "\n",
        "    if len(df_scr)==0:\n",
        "        evt = out[[\"subject_id\",\"hadm_id\",\"index_time\",\"vpt_flag\"]].copy()\n",
        "        evt[\"event_time_48\"] = pd.NaT\n",
        "        evt[\"event_time_7\"]  = pd.NaT\n",
        "        evt[\"event_time\"]    = pd.NaT\n",
        "    else:\n",
        "        tmp48 = (df_scr[(df_scr[\"dt\"]>0) & (df_scr[\"dt\"]<=48)]\n",
        "                 .merge(out[[\"subject_id\",\"hadm_id\",\"baseline\"]],\n",
        "                        on=[\"subject_id\",\"hadm_id\"], how=\"left\"))\n",
        "        hit48 = tmp48[tmp48[\"scr_mgdl\"] >= (tmp48[\"baseline\"] + 0.3)]\n",
        "        ev48 = (hit48.sort_values(\"charttime\")\n",
        "                     .groupby([\"subject_id\",\"hadm_id\"], as_index=False)\n",
        "                     .first()[[\"subject_id\",\"hadm_id\",\"charttime\"]]\n",
        "                     .rename(columns={\"charttime\":\"event_time_48\"}))\n",
        "\n",
        "        tmp7 = (df_scr[(df_scr[\"dt\"]>0) & (df_scr[\"dt\"]<=24*7)]\n",
        "                .merge(out[[\"subject_id\",\"hadm_id\",\"baseline\"]],\n",
        "                       on=[\"subject_id\",\"hadm_id\"], how=\"left\"))\n",
        "        hit7 = tmp7[tmp7[\"scr_mgdl\"] >= (1.5 * tmp7[\"baseline\"])]\n",
        "        ev7 = (hit7.sort_values(\"charttime\")\n",
        "                   .groupby([\"subject_id\",\"hadm_id\"], as_index=False)\n",
        "                   .first()[[\"subject_id\",\"hadm_id\",\"charttime\"]]\n",
        "                   .rename(columns={\"charttime\":\"event_time_7\"}))\n",
        "\n",
        "        evt = (out[[\"subject_id\",\"hadm_id\",\"index_time\",\"vpt_flag\"]]\n",
        "               .merge(ev48, how=\"left\")\n",
        "               .merge(ev7,  how=\"left\"))\n",
        "        evt[\"event_time\"] = evt[[\"event_time_48\",\"event_time_7\"]].min(axis=1)\n",
        "\n",
        "    evt = evt.merge(adm, on=[\"subject_id\",\"hadm_id\"], how=\"left\")\n",
        "    evt[\"censor_limit\"] = evt[\"index_time\"] + pd.Timedelta(days=7)\n",
        "    evt[\"censor_time\"]  = evt[[\"dischtime\",\"censor_limit\"]].min(axis=1)\n",
        "\n",
        "    evt = evt.dropna(subset=[\"index_time\",\"censor_time\"]).reset_index(drop=True)\n",
        "    evt[\"event_observed\"] = (evt[\"event_time\"].notna()) & (evt[\"event_time\"] <= evt[\"censor_time\"])\n",
        "    evt[\"duration_days\"] = (\n",
        "        np.where(\n",
        "            evt[\"event_observed\"],\n",
        "            (evt[\"event_time\"] - evt[\"index_time\"]).dt.total_seconds(),\n",
        "            (evt[\"censor_time\"] - evt[\"index_time\"]).dt.total_seconds()\n",
        "        ) / 86400.0\n",
        "    ).clip(min=0)\n",
        "\n",
        "    for k in (\"subject_id\",\"hadm_id\"):\n",
        "        evt[k] = evt[k].astype(\"Int64\")\n",
        "\n",
        "    print(f\"[tte] rows={len(evt)} events={int(evt['event_observed'].sum())}\")\n",
        "    return evt"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "xXtmijAL4K_J"
      },
      "outputs": [],
      "source": [
        "def run_pipeline_with_batch_features(HOSP: Path, NOTE: Path, df_outputs: pd.DataFrame):\n",
        "    # 1) Cohort\n",
        "    cohort = build_cohort(HOSP)\n",
        "\n",
        "    # 2) Labs → AKI\n",
        "    scr_ids = load_scr_itemids(HOSP)\n",
        "    df_scr  = load_scr_timeseries(HOSP, cohort, scr_ids)\n",
        "    out     = label_aki(df_scr, cohort)\n",
        "\n",
        "    # 3) TTE\n",
        "    evt = build_event_times(df_scr, out, HOSP)\n",
        "\n",
        "    # 4) (변경) 배치 결과에서 confounder 피처 직접 생성\n",
        "    note_feat = llm_features_from_batch_outputs(df_outputs)\n",
        "\n",
        "    # 5) Covariates\n",
        "    dfc = build_covariates(HOSP, out, note_feat)\n",
        "    dfc = dfc.merge(evt[[\"subject_id\",\"hadm_id\",\"duration_days\",\"event_observed\"]],\n",
        "                    on=[\"subject_id\",\"hadm_id\"], how=\"left\")\n",
        "    dfc = dfc.dropna(subset=[\"vpt_flag\",\"aki\",\"duration_days\",\"event_observed\"]).reset_index(drop=True)\n",
        "\n",
        "    print(f\"[analytic] N={len(dfc)}  events={int(dfc['event_observed'].sum())}  treated={int(dfc['vpt_flag'].sum())}\")\n",
        "\n",
        "    # 6) Evaluate BASE vs BASE+LLM\n",
        "    base_covs = [\"age\",\"sexM\",\"is_emerg\",\"baseline\"]\n",
        "    llm_covs  = base_covs + [c for c in CONFOUNDERS if c in dfc.columns]\n",
        "\n",
        "    m_base = evaluate_covset(dfc, base_covs, \"BASE\")\n",
        "    m_llm  = evaluate_covset(dfc, llm_covs,  \"BASE+LLM\")\n",
        "\n",
        "    perf = pd.DataFrame([m_base, m_llm])\n",
        "    perf.to_csv(OUTD/\"perf_base_vs_llm.csv\", index=False)\n",
        "\n",
        "    print(\"\\n=== Performance (BASE vs BASE+LLM) ===\")\n",
        "    cols_show = [\n",
        "        \"covset\",\"k_covs\",\n",
        "        \"mean_abs_SMD_before\",\"mean_abs_SMD_after\",\n",
        "        \"ESS\",\"KS_PS\",\n",
        "        \"IPTW_HR\",\"IPTW_LCL\",\"IPTW_UCL\",\n",
        "        \"DR_HR\",\"DR_LCL\",\"DR_UCL\",\n",
        "        \"Evalue_point\",\"Evalue_CI\"\n",
        "    ]\n",
        "    print(perf[cols_show])\n",
        "    print(f\"[saved] {OUTD/'perf_base_vs_llm.csv'}\")\n",
        "\n",
        "    return dfc, perf\n"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "AO6LG4405H79"
      },
      "outputs": [],
      "source": [
        "# =========================\n",
        "# 4) Batch outputs → note features (NO LLM calls)\n",
        "# =========================\n",
        "def _split_custom_id(custom_id: str) -> tuple[int|None, int|None]:\n",
        "    \"\"\"\n",
        "    기대 형식: '10000032_22595853' → (10000032, 22595853)\n",
        "    \"\"\"\n",
        "    if not isinstance(custom_id, str):\n",
        "        return (None, None)\n",
        "    s = custom_id.strip()\n",
        "    if not s or \"_\" not in s:\n",
        "        return (None, None)\n",
        "    a, b = s.split(\"_\", 1)\n",
        "    return (int(a), int(b)) if (a.isdigit() and b.isdigit()) else (None, None)\n",
        "\n",
        "def _parse_json_safely(s: str) -> dict:\n",
        "    if s is None or not isinstance(s, str) or not s.strip():\n",
        "        return {}\n",
        "    t = s.strip()\n",
        "    # ```json ... ``` 제거\n",
        "    if t.startswith(\"```\"):\n",
        "        t = re.sub(r\"^```(?:json)?\\s*|\\s*```$\", \"\", t, flags=re.IGNORECASE|re.DOTALL).strip()\n",
        "    # json.loads 우선\n",
        "    try:\n",
        "        return json.loads(t)\n",
        "    except Exception:\n",
        "        pass\n",
        "    # 중괄호 블럭만 추출해서 재시도\n",
        "    m = re.search(r\"\\{.*\\}\", t, flags=re.DOTALL)\n",
        "    if m:\n",
        "        try:\n",
        "            return json.loads(m.group(0))\n",
        "        except Exception:\n",
        "            pass\n",
        "    return {}\n",
        "\n",
        "def llm_features_from_batch_outputs(df_outputs: pd.DataFrame) -> pd.DataFrame:\n",
        "    \"\"\"\n",
        "    df_outputs 필요 컬럼:\n",
        "      - custom_id (형식: '{subject_id}_{hadm_id}')\n",
        "      - assistant_text (JSON 문자열)\n",
        "    선택 필터:\n",
        "      - http_status == 200\n",
        "      - finish_reason == 'stop'\n",
        "      - error isna()\n",
        "    반환: [subject_id, hadm_id] + CONFOUNDERS(0/1)\n",
        "    \"\"\"\n",
        "    need = {\"custom_id\", \"assistant_text\"}\n",
        "    missing = [c for c in need if c not in df_outputs.columns]\n",
        "    if missing:\n",
        "        raise ValueError(f\"df_outputs missing columns: {missing}\")\n",
        "\n",
        "    df = df_outputs.copy()\n",
        "\n",
        "    if \"http_status\" in df.columns:\n",
        "        df = df[df[\"http_status\"] == 200]\n",
        "    if \"finish_reason\" in df.columns:\n",
        "        df = df[df[\"finish_reason\"].astype(str).str.lower() == \"stop\"]\n",
        "    if \"error\" in df.columns:\n",
        "        df = df[df[\"error\"].isna()]\n",
        "\n",
        "    # custom_id → subject/hadm\n",
        "    sid_hadm = df[\"custom_id\"].apply(_split_custom_id)\n",
        "    df[\"subject_id\"] = [p[0] for p in sid_hadm]\n",
        "    df[\"hadm_id\"]    = [p[1] for p in sid_hadm]\n",
        "    df = df[~df[\"hadm_id\"].isna()].copy()\n",
        "\n",
        "    df[\"hadm_id\"] = df[\"hadm_id\"].astype(\"Int64\")\n",
        "    df[\"subject_id\"] = df[\"subject_id\"].astype(\"Int64\")\n",
        "\n",
        "    # assistant_text → confounders\n",
        "    feats = []\n",
        "    for s in df[\"assistant_text\"].astype(str):\n",
        "        obj = _parse_json_safely(s)\n",
        "        row = {}\n",
        "        for k in CONFOUNDERS:\n",
        "            v = obj.get(k, 0)\n",
        "            try:\n",
        "                row[k] = int(v)\n",
        "            except Exception:\n",
        "                row[k] = int(bool(v))\n",
        "        feats.append(row)\n",
        "    df_feat = pd.DataFrame(feats, index=df.index)\n",
        "\n",
        "    out = pd.concat([df[[\"subject_id\",\"hadm_id\"]], df_feat], axis=1)\n",
        "\n",
        "    # (subject, hadm) 중복 시 OR(=max) 집계\n",
        "    agg = {k: \"max\" for k in CONFOUNDERS}\n",
        "    out = (out.groupby([\"subject_id\",\"hadm_id\"], dropna=False, as_index=False)\n",
        "            .agg(agg))\n",
        "\n",
        "    for c in CONFOUNDERS:\n",
        "        out[c] = out[c].fillna(0).astype(int)\n",
        "\n",
        "    # 검증\n",
        "    assert out[\"hadm_id\"].notna().all(), \"hadm_id 누락 행 존재\"\n",
        "    return out"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "be3N8Vax5Kmz"
      },
      "outputs": [],
      "source": [
        "# =========================\n",
        "# 5) Covariates + PS + Survival\n",
        "# =========================\n",
        "def build_covariates(hosp: Path, out: pd.DataFrame, note_feat: pd.DataFrame) -> pd.DataFrame:\n",
        "    adm = pd.read_csv(hosp/\"admissions.csv.gz\",\n",
        "                      usecols=[\"subject_id\",\"hadm_id\",\"admittime\",\"dischtime\",\"admission_type\"],\n",
        "                      parse_dates=[\"admittime\",\"dischtime\"], **READ_KW)\n",
        "    pat = pd.read_csv(hosp/\"patients.csv.gz\",\n",
        "                      usecols=[\"subject_id\",\"gender\",\"anchor_age\"], **READ_KW)\n",
        "    adm[\"admittime\"] = _to_datetime_safe(adm[\"admittime\"])\n",
        "    adm[\"dischtime\"] = _to_datetime_safe(adm[\"dischtime\"])\n",
        "\n",
        "    dfc = (out.merge(adm, on=[\"subject_id\",\"hadm_id\"], how=\"left\")\n",
        "              .merge(pat, on=\"subject_id\", how=\"left\")\n",
        "              .merge(note_feat, on=[\"subject_id\",\"hadm_id\"], how=\"left\"))\n",
        "\n",
        "    dfc[\"age\"]      = pd.to_numeric(dfc[\"anchor_age\"], errors=\"coerce\")\n",
        "    dfc[\"sexM\"]     = (dfc[\"gender\"] == \"M\").astype(int)\n",
        "    dfc[\"is_emerg\"] = dfc[\"admission_type\"].astype(\"string\") \\\n",
        "                        .str.contains(RX_EMERG_SUB, na=False, regex=False).astype(int)\n",
        "\n",
        "    for c in CONFOUNDERS:\n",
        "        if c in dfc.columns: dfc[c] = dfc[c].fillna(0).astype(int)\n",
        "    return dfc\n",
        "\n",
        "def fit_ps_and_sw(dfc: pd.DataFrame, covs: list[str],\n",
        "                  ps_clip=PS_CLIP, w_trim=W_TRIM):\n",
        "    covs = [c for c in dict.fromkeys(covs) if c in dfc.columns]\n",
        "    if not covs:\n",
        "        raise ValueError(\"No covariates provided to fit_ps_and_sw.\")\n",
        "    X = dfc[covs].copy()\n",
        "    for c in covs: X[c] = pd.to_numeric(X[c], errors=\"coerce\")\n",
        "    X = X.fillna(X.median(numeric_only=True))\n",
        "\n",
        "    T = dfc[\"vpt_flag\"].astype(int)\n",
        "    ps_model = LogisticRegression(max_iter=400, solver=\"lbfgs\", random_state=RANDOM_STATE)\n",
        "    ps_model.fit(X, T)\n",
        "    ps = np.clip(ps_model.predict_proba(X)[:,1], *ps_clip)\n",
        "\n",
        "    p_t = float(T.mean())\n",
        "    sw = np.where(T==1, p_t/ps, (1-p_t)/(1-ps))\n",
        "    lo, hi = np.quantile(sw, w_trim); sw = np.clip(sw, lo, hi)\n",
        "\n",
        "    ESS = float((sw.sum()**2)/(sw**2).sum())\n",
        "    return X, ps, sw, ESS\n",
        "\n",
        "def cox_results_ipw_and_dr(dfc: pd.DataFrame, sw: np.ndarray, covs: list[str], penalizer=COX_PENALIZER):\n",
        "    if CoxPHFitter is None:\n",
        "        raise RuntimeError(\"lifelines is not installed.\")\n",
        "    d = pd.DataFrame({\n",
        "        \"time\":  pd.to_numeric(dfc[\"duration_days\"], errors=\"coerce\"),\n",
        "        \"event\": dfc[\"event_observed\"].astype(int),\n",
        "        \"treat\": dfc[\"vpt_flag\"].astype(int),\n",
        "        \"sw\":    sw\n",
        "    }).dropna(subset=[\"time\",\"event\",\"treat\",\"sw\"])\n",
        "\n",
        "    if d[\"event\"].sum() == 0:\n",
        "        raise RuntimeError(\"No events in TTE window; cannot fit Cox model.\")\n",
        "\n",
        "    cph_w = CoxPHFitter(penalizer=penalizer)\n",
        "    cph_w.fit(d, duration_col=\"time\", event_col=\"event\", weights_col=\"sw\", robust=True)\n",
        "    iptw_HR  = float(np.exp(cph_w.params_[\"treat\"]))\n",
        "    iptw_LCL, iptw_UCL = np.exp(cph_w.confidence_intervals_.loc[\"treat\"].values)\n",
        "\n",
        "    X = dfc[covs].copy()\n",
        "    for c in covs: X[c] = pd.to_numeric(X[c], errors=\"coerce\")\n",
        "    X = X.fillna(X.median(numeric_only=True))\n",
        "    d2 = pd.concat([d.reset_index(drop=True), X.reset_index(drop=True)], axis=1)\n",
        "\n",
        "    cph_dr = CoxPHFitter(penalizer=penalizer)\n",
        "    cph_dr.fit(d2, duration_col=\"time\", event_col=\"event\", weights_col=\"sw\", robust=True)\n",
        "    dr_HR  = float(np.exp(cph_dr.params_[\"treat\"]))\n",
        "    dr_LCL, dr_UCL = np.exp(cph_dr.confidence_intervals_.loc[\"treat\"].values)\n",
        "\n",
        "    return (iptw_HR, iptw_LCL, iptw_UCL), (dr_HR, dr_LCL, dr_UCL)\n",
        "\n",
        "def evaluate_covset(dfc: pd.DataFrame, covs: list[str], label=\"BASE\"):\n",
        "    covs = [c for c in dict.fromkeys(covs) if c in dfc.columns]\n",
        "    if not covs: raise ValueError(\"No covariates for evaluate_covset.\")\n",
        "\n",
        "    X, ps, sw, ESS = fit_ps_and_sw(dfc, covs)\n",
        "\n",
        "    T = dfc[\"vpt_flag\"].astype(int).values\n",
        "    smd_b = [abs(_smd(X[c].values, T, None)) for c in X.columns]\n",
        "    smd_a = [abs(_smd(X[c].values, T, sw))  for c in X.columns]\n",
        "    meanSMD_b = float(np.nanmean(smd_b)); meanSMD_a = float(np.nanmean(smd_a))\n",
        "\n",
        "    # KS(PS overlap)\n",
        "    try:\n",
        "        from scipy.stats import ks_2samp\n",
        "        KS = float(ks_2samp(ps[T==1], ps[T==0]).statistic)\n",
        "    except Exception:\n",
        "        grid = np.linspace(0,1,200)\n",
        "        c1 = np.searchsorted(np.sort(ps[T==1]), grid, side=\"right\")/max(1,(T==1).sum())\n",
        "        c0 = np.searchsorted(np.sort(ps[T==0]), grid, side=\"right\")/max(1,(T==0).sum())\n",
        "        KS = float(np.max(np.abs(c1-c0)))\n",
        "\n",
        "    (hr_i,l_i,u_i),(hr_d,l_d,u_d) = cox_results_ipw_and_dr(dfc, sw, covs)\n",
        "    E_point, E_CI = evalue_from_hr(hr_i, l_i, u_i)\n",
        "\n",
        "    return {\n",
        "        \"covset\":label, \"k_covs\":len(covs),\n",
        "        \"mean_abs_SMD_before\":meanSMD_b, \"mean_abs_SMD_after\":meanSMD_a,\n",
        "        \"ESS\":ESS, \"KS_PS\":KS,\n",
        "        \"IPTW_HR\":hr_i, \"IPTW_LCL\":l_i, \"IPTW_UCL\":u_i, \"IPTW_CI_width\":u_i-l_i,\n",
        "        \"DR_HR\":hr_d,   \"DR_LCL\":l_d,  \"DR_UCL\":u_d,  \"DR_CI_width\":u_d-l_d,\n",
        "        \"Evalue_point\":E_point, \"Evalue_CI\":E_CI\n",
        "    }\n"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "19WUEvFz5NwY"
      },
      "outputs": [],
      "source": [
        "# =========================\n",
        "# 6) Main (Batch features only)\n",
        "# =========================\n",
        "def run_pipeline_with_batch_features(HOSP: Path, NOTE: Path, df_outputs: pd.DataFrame):\n",
        "    # 1) Cohort\n",
        "    cohort = build_cohort(HOSP)\n",
        "\n",
        "    # 2) Labs → AKI\n",
        "    scr_ids = load_scr_itemids(HOSP)\n",
        "    df_scr  = load_scr_timeseries(HOSP, cohort, scr_ids)\n",
        "    out     = label_aki(df_scr, cohort)\n",
        "\n",
        "    # 3) TTE\n",
        "    evt = build_event_times(df_scr, out, HOSP)\n",
        "\n",
        "    # 4) 배치 결과 → confounder 피처\n",
        "    note_feat = llm_features_from_batch_outputs(df_outputs)\n",
        "    print(f\"[features] rows={len(note_feat)}  with confounders={CONFOUNDERS}\")\n",
        "\n",
        "    # 5) Covariates\n",
        "    dfc = build_covariates(HOSP, out, note_feat)\n",
        "    dfc = dfc.merge(evt[[\"subject_id\",\"hadm_id\",\"duration_days\",\"event_observed\"]],\n",
        "                    on=[\"subject_id\",\"hadm_id\"], how=\"left\")\n",
        "    dfc = dfc.dropna(subset=[\"vpt_flag\",\"aki\",\"duration_days\",\"event_observed\"]).reset_index(drop=True)\n",
        "\n",
        "    print(f\"[analytic] N={len(dfc)}  events={int(dfc['event_observed'].sum())}  treated={int(dfc['vpt_flag'].sum())}\")\n",
        "\n",
        "    # 6) Evaluate BASE vs BASE+LLM\n",
        "    base_covs = [\"age\",\"sexM\",\"is_emerg\",\"baseline\"]\n",
        "    llm_covs  = base_covs + [c for c in CONFOUNDERS if c in dfc.columns]\n",
        "\n",
        "    m_base = evaluate_covset(dfc, base_covs, \"BASE\")\n",
        "    m_llm  = evaluate_covset(dfc, llm_covs,  \"BASE+LLM\")\n",
        "\n",
        "    perf = pd.DataFrame([m_base, m_llm])\n",
        "    perf.to_csv(OUTD/\"perf_base_vs_llm.csv\", index=False)\n",
        "\n",
        "    print(\"\\n=== Performance (BASE vs BASE+LLM) ===\")\n",
        "    cols_show = [\n",
        "        \"covset\",\"k_covs\",\n",
        "        \"mean_abs_SMD_before\",\"mean_abs_SMD_after\",\n",
        "        \"ESS\",\"KS_PS\",\n",
        "        \"IPTW_HR\",\"IPTW_LCL\",\"IPTW_UCL\",\n",
        "        \"DR_HR\",\"DR_LCL\",\"DR_UCL\",\n",
        "        \"Evalue_point\",\"Evalue_CI\"\n",
        "    ]\n",
        "    print(perf[cols_show])\n",
        "    print(f\"[saved] {OUTD/'perf_base_vs_llm.csv'}\")\n",
        "\n",
        "    return dfc, perf"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "siiCJcSo4MEg"
      },
      "outputs": [],
      "source": [
        "df_outputs = pd.read_csv(\"/content/drive/MyDrive/data/mimiciv/3.1/results_ci/causal_inferencebatches_outputs.csv\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 1000
        },
        "id": "TBL0umaN4WK3",
        "outputId": "225076a1-a62e-4749-ad6d-6837279ddd30"
      },
      "outputs": [
        {
          "data": {
            "application/vnd.google.colaboratory.intrinsic+json": {
              "type": "dataframe",
              "variable_name": "df_outputs"
            },
            "text/html": [
              "\n",
              "  <div id=\"df-e4f3036b-90d8-4fc0-af95-c07d524728ba\" class=\"colab-df-container\">\n",
              "    <div>\n",
              "<style scoped>\n",
              "    .dataframe tbody tr th:only-of-type {\n",
              "        vertical-align: middle;\n",
              "    }\n",
              "\n",
              "    .dataframe tbody tr th {\n",
              "        vertical-align: top;\n",
              "    }\n",
              "\n",
              "    .dataframe thead th {\n",
              "        text-align: right;\n",
              "    }\n",
              "</style>\n",
              "<table border=\"1\" class=\"dataframe\">\n",
              "  <thead>\n",
              "    <tr style=\"text-align: right;\">\n",
              "      <th></th>\n",
              "      <th>batch_id</th>\n",
              "      <th>request_id</th>\n",
              "      <th>custom_id</th>\n",
              "      <th>http_status</th>\n",
              "      <th>api_request_id</th>\n",
              "      <th>model</th>\n",
              "      <th>assistant_role</th>\n",
              "      <th>assistant_text</th>\n",
              "      <th>finish_reason</th>\n",
              "      <th>prompt_tokens</th>\n",
              "      <th>completion_tokens</th>\n",
              "      <th>total_tokens</th>\n",
              "      <th>response_body_id</th>\n",
              "      <th>created</th>\n",
              "      <th>system_fingerprint</th>\n",
              "      <th>error</th>\n",
              "      <th>error_code</th>\n",
              "    </tr>\n",
              "  </thead>\n",
              "  <tbody>\n",
              "    <tr>\n",
              "      <th>0</th>\n",
              "      <td>batch_68ac33277ba881908f0432ed60f473e9</td>\n",
              "      <td>batch_req_68ac38fdfcf88190afdd4734d0178bec</td>\n",
              "      <td>10000032_22595853</td>\n",
              "      <td>200</td>\n",
              "      <td>09d9c1519aa33749a6511a0199adb022</td>\n",
              "      <td>gpt-4o-mini-2024-07-18</td>\n",
              "      <td>assistant</td>\n",
              "      <td>{\\n  \"f_ckd_pre\": 1,\\n  \"f_dm_pre\": 0,\\n  \"f_h...</td>\n",
              "      <td>stop</td>\n",
              "      <td>2521</td>\n",
              "      <td>53</td>\n",
              "      <td>2574</td>\n",
              "      <td>chatcmpl-C8OLATG3pViogJE2wR9kIRhwSKeNq</td>\n",
              "      <td>1756116224</td>\n",
              "      <td>fp_51db84afab</td>\n",
              "      <td>NaN</td>\n",
              "      <td>NaN</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>1</th>\n",
              "      <td>batch_68ac33277ba881908f0432ed60f473e9</td>\n",
              "      <td>batch_req_68ac38fdf5248190b2e9094e23f2be13</td>\n",
              "      <td>10000032_22841357</td>\n",
              "      <td>200</td>\n",
              "      <td>b531ba2fd53a746599a35a3e35553099</td>\n",
              "      <td>gpt-4o-mini-2024-07-18</td>\n",
              "      <td>assistant</td>\n",
              "      <td>{\\n  \"f_ckd_pre\": 1,\\n  \"f_dm_pre\": 0,\\n  \"f_h...</td>\n",
              "      <td>stop</td>\n",
              "      <td>3424</td>\n",
              "      <td>53</td>\n",
              "      <td>3477</td>\n",
              "      <td>chatcmpl-C8OLEiHJjus6hcnAFhd7SNJrXTPyO</td>\n",
              "      <td>1756116228</td>\n",
              "      <td>fp_560af6e559</td>\n",
              "      <td>NaN</td>\n",
              "      <td>NaN</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>2</th>\n",
              "      <td>batch_68ac33277ba881908f0432ed60f473e9</td>\n",
              "      <td>batch_req_68ac38fdf678819080f49e041d96fe70</td>\n",
              "      <td>10000032_25742920</td>\n",
              "      <td>200</td>\n",
              "      <td>da42a4a8fabba835d4e7f07083d4f81d</td>\n",
              "      <td>gpt-4o-mini-2024-07-18</td>\n",
              "      <td>assistant</td>\n",
              "      <td>{\\n  \"f_ckd_pre\": 1,\\n  \"f_dm_pre\": 0,\\n  \"f_h...</td>\n",
              "      <td>stop</td>\n",
              "      <td>3459</td>\n",
              "      <td>53</td>\n",
              "      <td>3512</td>\n",
              "      <td>chatcmpl-C8OLC3T669ISRNPs2ORkRkynz5T2a</td>\n",
              "      <td>1756116226</td>\n",
              "      <td>fp_51db84afab</td>\n",
              "      <td>NaN</td>\n",
              "      <td>NaN</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>3</th>\n",
              "      <td>batch_68ac33277ba881908f0432ed60f473e9</td>\n",
              "      <td>batch_req_68ac38fdf81081908d3095c4a15c7ed4</td>\n",
              "      <td>10000032_29079034</td>\n",
              "      <td>200</td>\n",
              "      <td>51c0a3ea5656d56c8b1301ef64c8d531</td>\n",
              "      <td>gpt-4o-mini-2024-07-18</td>\n",
              "      <td>assistant</td>\n",
              "      <td>{\\n  \"f_ckd_pre\": 1,\\n  \"f_dm_pre\": 0,\\n  \"f_h...</td>\n",
              "      <td>stop</td>\n",
              "      <td>3381</td>\n",
              "      <td>53</td>\n",
              "      <td>3434</td>\n",
              "      <td>chatcmpl-C8OLCjVkZAlfuw4ZCGxiLyIwQL4Jy</td>\n",
              "      <td>1756116226</td>\n",
              "      <td>fp_51db84afab</td>\n",
              "      <td>NaN</td>\n",
              "      <td>NaN</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>4</th>\n",
              "      <td>batch_68ac33277ba881908f0432ed60f473e9</td>\n",
              "      <td>batch_req_68ac38fdfbc8819086cbd3b73aa5b354</td>\n",
              "      <td>10000084_23052089</td>\n",
              "      <td>200</td>\n",
              "      <td>f57a3d858c6d76e70ab21a61781240f0</td>\n",
              "      <td>gpt-4o-mini-2024-07-18</td>\n",
              "      <td>assistant</td>\n",
              "      <td>{\\n  \"f_ckd_pre\": 0,\\n  \"f_dm_pre\": 0,\\n  \"f_h...</td>\n",
              "      <td>stop</td>\n",
              "      <td>3009</td>\n",
              "      <td>53</td>\n",
              "      <td>3062</td>\n",
              "      <td>chatcmpl-C8OLEns9QpypGzSkll89ZSmRojiWk</td>\n",
              "      <td>1756116228</td>\n",
              "      <td>fp_560af6e559</td>\n",
              "      <td>NaN</td>\n",
              "      <td>NaN</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>...</th>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "      <td>...</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>331788</th>\n",
              "      <td>batch_68ac3626e4d48190aa35489149fa4cab</td>\n",
              "      <td>batch_req_68ad280543f48190a25e781cd209a129</td>\n",
              "      <td>11533102_22785311</td>\n",
              "      <td>200</td>\n",
              "      <td>059acedf8f1758de5ef62181b5ed9122</td>\n",
              "      <td>gpt-4o-mini-2024-07-18</td>\n",
              "      <td>assistant</td>\n",
              "      <td>{\\n  \"f_ckd_pre\": 0,\\n  \"f_dm_pre\": 1,\\n  \"f_h...</td>\n",
              "      <td>stop</td>\n",
              "      <td>4788</td>\n",
              "      <td>53</td>\n",
              "      <td>4841</td>\n",
              "      <td>chatcmpl-C8aTffiLORG90D1JvCZyhlay9Y18i</td>\n",
              "      <td>1756162879</td>\n",
              "      <td>fp_560af6e559</td>\n",
              "      <td>NaN</td>\n",
              "      <td>NaN</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>331789</th>\n",
              "      <td>batch_68ac3626e4d48190aa35489149fa4cab</td>\n",
              "      <td>batch_req_68ad2805462c8190b36a2d8ac99aecb3</td>\n",
              "      <td>11533102_27365014</td>\n",
              "      <td>200</td>\n",
              "      <td>37e5986cee5fef365601fcc839edd781</td>\n",
              "      <td>gpt-4o-mini-2024-07-18</td>\n",
              "      <td>assistant</td>\n",
              "      <td>{\\n  \"f_ckd_pre\": 0,\\n  \"f_dm_pre\": 1,\\n  \"f_h...</td>\n",
              "      <td>stop</td>\n",
              "      <td>4721</td>\n",
              "      <td>53</td>\n",
              "      <td>4774</td>\n",
              "      <td>chatcmpl-C8aTeQzfsobgDlgNS0KTHky2nb164</td>\n",
              "      <td>1756162878</td>\n",
              "      <td>fp_560af6e559</td>\n",
              "      <td>NaN</td>\n",
              "      <td>NaN</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>331790</th>\n",
              "      <td>batch_68ac3626e4d48190aa35489149fa4cab</td>\n",
              "      <td>batch_req_68ad28055f4881909bf6ab7417ba2c02</td>\n",
              "      <td>11533102_28939043</td>\n",
              "      <td>200</td>\n",
              "      <td>d1de20de7e1be514215bdf1b5a2da4ef</td>\n",
              "      <td>gpt-4o-mini-2024-07-18</td>\n",
              "      <td>assistant</td>\n",
              "      <td>{\\n  \"f_ckd_pre\": 0,\\n  \"f_dm_pre\": 1,\\n  \"f_h...</td>\n",
              "      <td>stop</td>\n",
              "      <td>2819</td>\n",
              "      <td>53</td>\n",
              "      <td>2872</td>\n",
              "      <td>chatcmpl-C8ajAmpyF9i7XW2mZfBB8JyeIpBdu</td>\n",
              "      <td>1756163840</td>\n",
              "      <td>fp_560af6e559</td>\n",
              "      <td>NaN</td>\n",
              "      <td>NaN</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>331791</th>\n",
              "      <td>batch_68ac3626e4d48190aa35489149fa4cab</td>\n",
              "      <td>batch_req_68ad28055db881908657709086a412dd</td>\n",
              "      <td>11533102_29936329</td>\n",
              "      <td>200</td>\n",
              "      <td>a43a83e7f1bc7675ae528b9c320a581a</td>\n",
              "      <td>gpt-4o-mini-2024-07-18</td>\n",
              "      <td>assistant</td>\n",
              "      <td>{\\n  \"f_ckd_pre\": 0,\\n  \"f_dm_pre\": 1,\\n  \"f_h...</td>\n",
              "      <td>stop</td>\n",
              "      <td>4184</td>\n",
              "      <td>53</td>\n",
              "      <td>4237</td>\n",
              "      <td>chatcmpl-C8aTgCWVMemYqzETqS643rDcjrqwV</td>\n",
              "      <td>1756162880</td>\n",
              "      <td>fp_51db84afab</td>\n",
              "      <td>NaN</td>\n",
              "      <td>NaN</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>331792</th>\n",
              "      <td>batch_68ac3626e4d48190aa35489149fa4cab</td>\n",
              "      <td>batch_req_68ad2805aa00819083261e6a0ce5029e</td>\n",
              "      <td>11533158_26616882</td>\n",
              "      <td>200</td>\n",
              "      <td>85e4b8555db7c1337f276ecfb37850c7</td>\n",
              "      <td>gpt-4o-mini-2024-07-18</td>\n",
              "      <td>assistant</td>\n",
              "      <td>{\\n  \"f_ckd_pre\": 1,\\n  \"f_dm_pre\": 0,\\n  \"f_h...</td>\n",
              "      <td>stop</td>\n",
              "      <td>2259</td>\n",
              "      <td>53</td>\n",
              "      <td>2312</td>\n",
              "      <td>chatcmpl-C8aTf0H6EiPQ93WYNbD9yNPRcNJAj</td>\n",
              "      <td>1756162879</td>\n",
              "      <td>fp_560af6e559</td>\n",
              "      <td>NaN</td>\n",
              "      <td>NaN</td>\n",
              "    </tr>\n",
              "  </tbody>\n",
              "</table>\n",
              "<p>331793 rows × 17 columns</p>\n",
              "</div>\n",
              "    <div class=\"colab-df-buttons\">\n",
              "\n",
              "  <div class=\"colab-df-container\">\n",
              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-e4f3036b-90d8-4fc0-af95-c07d524728ba')\"\n",
              "            title=\"Convert this dataframe to an interactive table.\"\n",
              "            style=\"display:none;\">\n",
              "\n",
              "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\" viewBox=\"0 -960 960 960\">\n",
              "    <path d=\"M120-120v-720h720v720H120Zm60-500h600v-160H180v160Zm220 220h160v-160H400v160Zm0 220h160v-160H400v160ZM180-400h160v-160H180v160Zm440 0h160v-160H620v160ZM180-180h160v-160H180v160Zm440 0h160v-160H620v160Z\"/>\n",
              "  </svg>\n",
              "    </button>\n",
              "\n",
              "  <style>\n",
              "    .colab-df-container {\n",
              "      display:flex;\n",
              "      gap: 12px;\n",
              "    }\n",
              "\n",
              "    .colab-df-convert {\n",
              "      background-color: #E8F0FE;\n",
              "      border: none;\n",
              "      border-radius: 50%;\n",
              "      cursor: pointer;\n",
              "      display: none;\n",
              "      fill: #1967D2;\n",
              "      height: 32px;\n",
              "      padding: 0 0 0 0;\n",
              "      width: 32px;\n",
              "    }\n",
              "\n",
              "    .colab-df-convert:hover {\n",
              "      background-color: #E2EBFA;\n",
              "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
              "      fill: #174EA6;\n",
              "    }\n",
              "\n",
              "    .colab-df-buttons div {\n",
              "      margin-bottom: 4px;\n",
              "    }\n",
              "\n",
              "    [theme=dark] .colab-df-convert {\n",
              "      background-color: #3B4455;\n",
              "      fill: #D2E3FC;\n",
              "    }\n",
              "\n",
              "    [theme=dark] .colab-df-convert:hover {\n",
              "      background-color: #434B5C;\n",
              "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
              "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
              "      fill: #FFFFFF;\n",
              "    }\n",
              "  </style>\n",
              "\n",
              "    <script>\n",
              "      const buttonEl =\n",
              "        document.querySelector('#df-e4f3036b-90d8-4fc0-af95-c07d524728ba button.colab-df-convert');\n",
              "      buttonEl.style.display =\n",
              "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
              "\n",
              "      async function convertToInteractive(key) {\n",
              "        const element = document.querySelector('#df-e4f3036b-90d8-4fc0-af95-c07d524728ba');\n",
              "        const dataTable =\n",
              "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
              "                                                    [key], {});\n",
              "        if (!dataTable) return;\n",
              "\n",
              "        const docLinkHtml = 'Like what you see? Visit the ' +\n",
              "          '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
              "          + ' to learn more about interactive tables.';\n",
              "        element.innerHTML = '';\n",
              "        dataTable['output_type'] = 'display_data';\n",
              "        await google.colab.output.renderOutput(dataTable, element);\n",
              "        const docLink = document.createElement('div');\n",
              "        docLink.innerHTML = docLinkHtml;\n",
              "        element.appendChild(docLink);\n",
              "      }\n",
              "    </script>\n",
              "  </div>\n",
              "\n",
              "\n",
              "    <div id=\"df-3106a3f6-5473-49c0-857f-ed65c8457e79\">\n",
              "      <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-3106a3f6-5473-49c0-857f-ed65c8457e79')\"\n",
              "                title=\"Suggest charts\"\n",
              "                style=\"display:none;\">\n",
              "\n",
              "<svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
              "     width=\"24px\">\n",
              "    <g>\n",
              "        <path d=\"M19 3H5c-1.1 0-2 .9-2 2v14c0 1.1.9 2 2 2h14c1.1 0 2-.9 2-2V5c0-1.1-.9-2-2-2zM9 17H7v-7h2v7zm4 0h-2V7h2v10zm4 0h-2v-4h2v4z\"/>\n",
              "    </g>\n",
              "</svg>\n",
              "      </button>\n",
              "\n",
              "<style>\n",
              "  .colab-df-quickchart {\n",
              "      --bg-color: #E8F0FE;\n",
              "      --fill-color: #1967D2;\n",
              "      --hover-bg-color: #E2EBFA;\n",
              "      --hover-fill-color: #174EA6;\n",
              "      --disabled-fill-color: #AAA;\n",
              "      --disabled-bg-color: #DDD;\n",
              "  }\n",
              "\n",
              "  [theme=dark] .colab-df-quickchart {\n",
              "      --bg-color: #3B4455;\n",
              "      --fill-color: #D2E3FC;\n",
              "      --hover-bg-color: #434B5C;\n",
              "      --hover-fill-color: #FFFFFF;\n",
              "      --disabled-bg-color: #3B4455;\n",
              "      --disabled-fill-color: #666;\n",
              "  }\n",
              "\n",
              "  .colab-df-quickchart {\n",
              "    background-color: var(--bg-color);\n",
              "    border: none;\n",
              "    border-radius: 50%;\n",
              "    cursor: pointer;\n",
              "    display: none;\n",
              "    fill: var(--fill-color);\n",
              "    height: 32px;\n",
              "    padding: 0;\n",
              "    width: 32px;\n",
              "  }\n",
              "\n",
              "  .colab-df-quickchart:hover {\n",
              "    background-color: var(--hover-bg-color);\n",
              "    box-shadow: 0 1px 2px rgba(60, 64, 67, 0.3), 0 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
              "    fill: var(--button-hover-fill-color);\n",
              "  }\n",
              "\n",
              "  .colab-df-quickchart-complete:disabled,\n",
              "  .colab-df-quickchart-complete:disabled:hover {\n",
              "    background-color: var(--disabled-bg-color);\n",
              "    fill: var(--disabled-fill-color);\n",
              "    box-shadow: none;\n",
              "  }\n",
              "\n",
              "  .colab-df-spinner {\n",
              "    border: 2px solid var(--fill-color);\n",
              "    border-color: transparent;\n",
              "    border-bottom-color: var(--fill-color);\n",
              "    animation:\n",
              "      spin 1s steps(1) infinite;\n",
              "  }\n",
              "\n",
              "  @keyframes spin {\n",
              "    0% {\n",
              "      border-color: transparent;\n",
              "      border-bottom-color: var(--fill-color);\n",
              "      border-left-color: var(--fill-color);\n",
              "    }\n",
              "    20% {\n",
              "      border-color: transparent;\n",
              "      border-left-color: var(--fill-color);\n",
              "      border-top-color: var(--fill-color);\n",
              "    }\n",
              "    30% {\n",
              "      border-color: transparent;\n",
              "      border-left-color: var(--fill-color);\n",
              "      border-top-color: var(--fill-color);\n",
              "      border-right-color: var(--fill-color);\n",
              "    }\n",
              "    40% {\n",
              "      border-color: transparent;\n",
              "      border-right-color: var(--fill-color);\n",
              "      border-top-color: var(--fill-color);\n",
              "    }\n",
              "    60% {\n",
              "      border-color: transparent;\n",
              "      border-right-color: var(--fill-color);\n",
              "    }\n",
              "    80% {\n",
              "      border-color: transparent;\n",
              "      border-right-color: var(--fill-color);\n",
              "      border-bottom-color: var(--fill-color);\n",
              "    }\n",
              "    90% {\n",
              "      border-color: transparent;\n",
              "      border-bottom-color: var(--fill-color);\n",
              "    }\n",
              "  }\n",
              "</style>\n",
              "\n",
              "      <script>\n",
              "        async function quickchart(key) {\n",
              "          const quickchartButtonEl =\n",
              "            document.querySelector('#' + key + ' button');\n",
              "          quickchartButtonEl.disabled = true;  // To prevent multiple clicks.\n",
              "          quickchartButtonEl.classList.add('colab-df-spinner');\n",
              "          try {\n",
              "            const charts = await google.colab.kernel.invokeFunction(\n",
              "                'suggestCharts', [key], {});\n",
              "          } catch (error) {\n",
              "            console.error('Error during call to suggestCharts:', error);\n",
              "          }\n",
              "          quickchartButtonEl.classList.remove('colab-df-spinner');\n",
              "          quickchartButtonEl.classList.add('colab-df-quickchart-complete');\n",
              "        }\n",
              "        (() => {\n",
              "          let quickchartButtonEl =\n",
              "            document.querySelector('#df-3106a3f6-5473-49c0-857f-ed65c8457e79 button');\n",
              "          quickchartButtonEl.style.display =\n",
              "            google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
              "        })();\n",
              "      </script>\n",
              "    </div>\n",
              "\n",
              "  <div id=\"id_90697448-5e7a-40fc-84c7-2fa4925c3449\">\n",
              "    <style>\n",
              "      .colab-df-generate {\n",
              "        background-color: #E8F0FE;\n",
              "        border: none;\n",
              "        border-radius: 50%;\n",
              "        cursor: pointer;\n",
              "        display: none;\n",
              "        fill: #1967D2;\n",
              "        height: 32px;\n",
              "        padding: 0 0 0 0;\n",
              "        width: 32px;\n",
              "      }\n",
              "\n",
              "      .colab-df-generate:hover {\n",
              "        background-color: #E2EBFA;\n",
              "        box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
              "        fill: #174EA6;\n",
              "      }\n",
              "\n",
              "      [theme=dark] .colab-df-generate {\n",
              "        background-color: #3B4455;\n",
              "        fill: #D2E3FC;\n",
              "      }\n",
              "\n",
              "      [theme=dark] .colab-df-generate:hover {\n",
              "        background-color: #434B5C;\n",
              "        box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
              "        filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
              "        fill: #FFFFFF;\n",
              "      }\n",
              "    </style>\n",
              "    <button class=\"colab-df-generate\" onclick=\"generateWithVariable('df_outputs')\"\n",
              "            title=\"Generate code using this dataframe.\"\n",
              "            style=\"display:none;\">\n",
              "\n",
              "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
              "       width=\"24px\">\n",
              "    <path d=\"M7,19H8.4L18.45,9,17,7.55,7,17.6ZM5,21V16.75L18.45,3.32a2,2,0,0,1,2.83,0l1.4,1.43a1.91,1.91,0,0,1,.58,1.4,1.91,1.91,0,0,1-.58,1.4L9.25,21ZM18.45,9,17,7.55Zm-12,3A5.31,5.31,0,0,0,4.9,8.1,5.31,5.31,0,0,0,1,6.5,5.31,5.31,0,0,0,4.9,4.9,5.31,5.31,0,0,0,6.5,1,5.31,5.31,0,0,0,8.1,4.9,5.31,5.31,0,0,0,12,6.5,5.46,5.46,0,0,0,6.5,12Z\"/>\n",
              "  </svg>\n",
              "    </button>\n",
              "    <script>\n",
              "      (() => {\n",
              "      const buttonEl =\n",
              "        document.querySelector('#id_90697448-5e7a-40fc-84c7-2fa4925c3449 button.colab-df-generate');\n",
              "      buttonEl.style.display =\n",
              "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
              "\n",
              "      buttonEl.onclick = () => {\n",
              "        google.colab.notebook.generateWithVariable('df_outputs');\n",
              "      }\n",
              "      })();\n",
              "    </script>\n",
              "  </div>\n",
              "\n",
              "    </div>\n",
              "  </div>\n"
            ],
            "text/plain": [
              "                                      batch_id  \\\n",
              "0       batch_68ac33277ba881908f0432ed60f473e9   \n",
              "1       batch_68ac33277ba881908f0432ed60f473e9   \n",
              "2       batch_68ac33277ba881908f0432ed60f473e9   \n",
              "3       batch_68ac33277ba881908f0432ed60f473e9   \n",
              "4       batch_68ac33277ba881908f0432ed60f473e9   \n",
              "...                                        ...   \n",
              "331788  batch_68ac3626e4d48190aa35489149fa4cab   \n",
              "331789  batch_68ac3626e4d48190aa35489149fa4cab   \n",
              "331790  batch_68ac3626e4d48190aa35489149fa4cab   \n",
              "331791  batch_68ac3626e4d48190aa35489149fa4cab   \n",
              "331792  batch_68ac3626e4d48190aa35489149fa4cab   \n",
              "\n",
              "                                        request_id          custom_id  \\\n",
              "0       batch_req_68ac38fdfcf88190afdd4734d0178bec  10000032_22595853   \n",
              "1       batch_req_68ac38fdf5248190b2e9094e23f2be13  10000032_22841357   \n",
              "2       batch_req_68ac38fdf678819080f49e041d96fe70  10000032_25742920   \n",
              "3       batch_req_68ac38fdf81081908d3095c4a15c7ed4  10000032_29079034   \n",
              "4       batch_req_68ac38fdfbc8819086cbd3b73aa5b354  10000084_23052089   \n",
              "...                                            ...                ...   \n",
              "331788  batch_req_68ad280543f48190a25e781cd209a129  11533102_22785311   \n",
              "331789  batch_req_68ad2805462c8190b36a2d8ac99aecb3  11533102_27365014   \n",
              "331790  batch_req_68ad28055f4881909bf6ab7417ba2c02  11533102_28939043   \n",
              "331791  batch_req_68ad28055db881908657709086a412dd  11533102_29936329   \n",
              "331792  batch_req_68ad2805aa00819083261e6a0ce5029e  11533158_26616882   \n",
              "\n",
              "        http_status                    api_request_id                   model  \\\n",
              "0               200  09d9c1519aa33749a6511a0199adb022  gpt-4o-mini-2024-07-18   \n",
              "1               200  b531ba2fd53a746599a35a3e35553099  gpt-4o-mini-2024-07-18   \n",
              "2               200  da42a4a8fabba835d4e7f07083d4f81d  gpt-4o-mini-2024-07-18   \n",
              "3               200  51c0a3ea5656d56c8b1301ef64c8d531  gpt-4o-mini-2024-07-18   \n",
              "4               200  f57a3d858c6d76e70ab21a61781240f0  gpt-4o-mini-2024-07-18   \n",
              "...             ...                               ...                     ...   \n",
              "331788          200  059acedf8f1758de5ef62181b5ed9122  gpt-4o-mini-2024-07-18   \n",
              "331789          200  37e5986cee5fef365601fcc839edd781  gpt-4o-mini-2024-07-18   \n",
              "331790          200  d1de20de7e1be514215bdf1b5a2da4ef  gpt-4o-mini-2024-07-18   \n",
              "331791          200  a43a83e7f1bc7675ae528b9c320a581a  gpt-4o-mini-2024-07-18   \n",
              "331792          200  85e4b8555db7c1337f276ecfb37850c7  gpt-4o-mini-2024-07-18   \n",
              "\n",
              "       assistant_role                                     assistant_text  \\\n",
              "0           assistant  {\\n  \"f_ckd_pre\": 1,\\n  \"f_dm_pre\": 0,\\n  \"f_h...   \n",
              "1           assistant  {\\n  \"f_ckd_pre\": 1,\\n  \"f_dm_pre\": 0,\\n  \"f_h...   \n",
              "2           assistant  {\\n  \"f_ckd_pre\": 1,\\n  \"f_dm_pre\": 0,\\n  \"f_h...   \n",
              "3           assistant  {\\n  \"f_ckd_pre\": 1,\\n  \"f_dm_pre\": 0,\\n  \"f_h...   \n",
              "4           assistant  {\\n  \"f_ckd_pre\": 0,\\n  \"f_dm_pre\": 0,\\n  \"f_h...   \n",
              "...               ...                                                ...   \n",
              "331788      assistant  {\\n  \"f_ckd_pre\": 0,\\n  \"f_dm_pre\": 1,\\n  \"f_h...   \n",
              "331789      assistant  {\\n  \"f_ckd_pre\": 0,\\n  \"f_dm_pre\": 1,\\n  \"f_h...   \n",
              "331790      assistant  {\\n  \"f_ckd_pre\": 0,\\n  \"f_dm_pre\": 1,\\n  \"f_h...   \n",
              "331791      assistant  {\\n  \"f_ckd_pre\": 0,\\n  \"f_dm_pre\": 1,\\n  \"f_h...   \n",
              "331792      assistant  {\\n  \"f_ckd_pre\": 1,\\n  \"f_dm_pre\": 0,\\n  \"f_h...   \n",
              "\n",
              "       finish_reason  prompt_tokens  completion_tokens  total_tokens  \\\n",
              "0               stop           2521                 53          2574   \n",
              "1               stop           3424                 53          3477   \n",
              "2               stop           3459                 53          3512   \n",
              "3               stop           3381                 53          3434   \n",
              "4               stop           3009                 53          3062   \n",
              "...              ...            ...                ...           ...   \n",
              "331788          stop           4788                 53          4841   \n",
              "331789          stop           4721                 53          4774   \n",
              "331790          stop           2819                 53          2872   \n",
              "331791          stop           4184                 53          4237   \n",
              "331792          stop           2259                 53          2312   \n",
              "\n",
              "                              response_body_id     created system_fingerprint  \\\n",
              "0       chatcmpl-C8OLATG3pViogJE2wR9kIRhwSKeNq  1756116224      fp_51db84afab   \n",
              "1       chatcmpl-C8OLEiHJjus6hcnAFhd7SNJrXTPyO  1756116228      fp_560af6e559   \n",
              "2       chatcmpl-C8OLC3T669ISRNPs2ORkRkynz5T2a  1756116226      fp_51db84afab   \n",
              "3       chatcmpl-C8OLCjVkZAlfuw4ZCGxiLyIwQL4Jy  1756116226      fp_51db84afab   \n",
              "4       chatcmpl-C8OLEns9QpypGzSkll89ZSmRojiWk  1756116228      fp_560af6e559   \n",
              "...                                        ...         ...                ...   \n",
              "331788  chatcmpl-C8aTffiLORG90D1JvCZyhlay9Y18i  1756162879      fp_560af6e559   \n",
              "331789  chatcmpl-C8aTeQzfsobgDlgNS0KTHky2nb164  1756162878      fp_560af6e559   \n",
              "331790  chatcmpl-C8ajAmpyF9i7XW2mZfBB8JyeIpBdu  1756163840      fp_560af6e559   \n",
              "331791  chatcmpl-C8aTgCWVMemYqzETqS643rDcjrqwV  1756162880      fp_51db84afab   \n",
              "331792  chatcmpl-C8aTf0H6EiPQ93WYNbD9yNPRcNJAj  1756162879      fp_560af6e559   \n",
              "\n",
              "        error  error_code  \n",
              "0         NaN         NaN  \n",
              "1         NaN         NaN  \n",
              "2         NaN         NaN  \n",
              "3         NaN         NaN  \n",
              "4         NaN         NaN  \n",
              "...       ...         ...  \n",
              "331788    NaN         NaN  \n",
              "331789    NaN         NaN  \n",
              "331790    NaN         NaN  \n",
              "331791    NaN         NaN  \n",
              "331792    NaN         NaN  \n",
              "\n",
              "[331793 rows x 17 columns]"
            ]
          },
          "execution_count": 9,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "df_outputs"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "POgaFody4hR3",
        "outputId": "f6331059-79bd-4087-e2bf-652b8cc1c4c6"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "[cohort] N=90327  VPT=7822\n",
            "[scr ids] K=3  sample: [50912, 52024, 52546]\n",
            "[scr ts] rows=1172668\n",
            "[aki] rate=0.175  N=90327\n",
            "[tte] rows=90327 events=15811\n",
            "[features] rows=331793  with confounders=['f_ckd_pre', 'f_dm_pre', 'f_hf_pre', 'f_liver_pre', 'f_nephrotox_pre']\n",
            "[analytic] N=90327  events=15811  treated=7822\n",
            "\n",
            "=== Performance (BASE vs BASE+LLM) ===\n",
            "     covset  k_covs  mean_abs_SMD_before  mean_abs_SMD_after           ESS  \\\n",
            "0      BASE       4             0.089088            0.017767  90063.509977   \n",
            "1  BASE+LLM       9             0.100799            0.017629  89869.120563   \n",
            "\n",
            "      KS_PS   IPTW_HR  IPTW_LCL  IPTW_UCL     DR_HR    DR_LCL    DR_UCL  \\\n",
            "0  0.098516  1.439858  1.389221   1.49234  1.441970  1.390700  1.495131   \n",
            "1  0.128194  1.399645  1.350395   1.45069  1.402752  1.352899  1.454443   \n",
            "\n",
            "   Evalue_point  Evalue_CI  \n",
            "0      2.235679   2.124554  \n",
            "1      2.147549   2.038270  \n",
            "[saved] /content/drive/MyDrive/results_ci/perf_base_vs_llm.csv\n"
          ]
        }
      ],
      "source": [
        "dfc, perf = run_pipeline_with_batch_features(HOSP, NOTE, df_outputs)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 361
        },
        "id": "H4B9kDBH8PCD",
        "outputId": "3d0f68b7-5ea8-4632-833d-e6451aef91f7"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "PS AUC: BASE vs LLM → 0.5625350112049337 vs 0.5854034740710027\n",
            "PS KS:  BASE vs LLM → 0.09851579778425834 vs 0.12819418009129901\n",
            "ESS(LLM): 89869.12056348818\n"
          ]
        },
        {
          "data": {
            "image/png": "iVBORw0KGgoAAAANSUhEUgAAAk4AAAEiCAYAAAAPh11JAAAAOnRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjEwLjAsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcvlHJYcgAAAAlwSFlzAAAPYQAAD2EBqD+naQAAaWRJREFUeJzt3XlcVNX7B/DPnRlmGJhhRjbZZBPcRcUtysTEBDM3LBc0MU3LLDXL1PqJIrl8TXPJMnM3NS3X0q/mkriQO2qahIIgoigkMuwzMHN+f0zcryOLA8IMy/N+vebFzL3n3vvcuQPzcM6553CMMQZCCCGEEPJMAnMHQAghhBBSV1DiRAghhBBiJEqcCCGEEEKMRIkTIYQQQoiRKHEihBBCCDESJU6EEEIIIUaixIkQQgghxEiUOBFCCCGEGIkSJ0IIIYQQI1HiRAhpcDZu3AiO45CcnGyS4+Xm5sLR0RFbt241yfHI/9y4cQMikQjXr183dyiknqDEiRBSppLk4uLFi+YOpVbZtm0bli1bVqltli9fDrlcjmHDhvHL5syZA47j+IdAIICzszNef/11nD17ttx9xcXFgeM4WFpaIisrq8wyOp0OmzdvRteuXWFrawu5XI5mzZph1KhRBvuOjo42iOHpx/bt2yt1nmXhOA4ffPBBhWV69OiBNm3aVFim5P0SCAS4e/duqfXZ2dmQSqWljteqVSv07dsXERERVTsBQp4iMncAhBBSl2zbtg3Xr1/HlClTjCpfVFSE5cuX46OPPoJQKCy1ftWqVZDJZNDpdLh79y7WrFmD7t274/z582jfvn2p8lu2bIGTkxMeP36MnTt34p133ilVZtKkSfjmm28wYMAAjBgxAiKRCPHx8Th48CC8vb3xwgsvlCrfuXPnUvsJCAgw6hxNSSKR4Mcff8Snn35qsHz37t3lbvPee+/htddeQ2JiIpo2bVrTIZJ6jhInQgipQfv370dGRgaGDBlS5vo33ngD9vb2/OuBAweiTZs2+Pnnn0slTowxbNu2DWFhYUhKSsLWrVtLJU4PHz7Et99+i3HjxuH77783WLds2TJkZGSUiuHll1/GG2+8Uanzio6OxiuvvIKkpCR4enpWatvn8dprr5WZOG3btg19+/bFrl27Sm3Tq1cvNGrUCJs2bcLcuXNNFSqpp6ipjhDyXC5fvow+ffrAxsYGMpkMQUFBBs1BFy9eBMdx2LRpU6ltf/vtN3Ach/379/PL7t27hzFjxqBx48aQSCRo3bo11q9fb1QsJc00W7duRfPmzWFpaYmOHTvi5MmTRm3/7bffonXr1pBIJHBxccHEiRMNmsN69OiBAwcO4M6dO3xz1rOShr1798LT09Pomg4nJycAgEhU+v/amJgYJCcnY9iwYRg2bBhOnjyJ1NRUgzJJSUlgjOGll14qtT3HcXB0dDQqjtoqLCwMV65cwd9//80ve/DgAX7//XeEhYWVuY2FhQV69OiBffv2mSpMUo9R4kQIqbK//voLL7/8Mq5evYpPP/0Us2bNQlJSEnr06IFz584BADp16gRvb2/89NNPpbbfsWMHGjVqhODgYAD62pIXXngBR48exQcffIDly5fDx8cHY8eONbpf0YkTJzBlyhSMHDkSc+fOxaNHjxASEvLMzsFz5szBxIkT4eLigiVLlmDw4MFYvXo1evfujaKiIgDA559/jvbt28Pe3h4//PADfvjhh2fG9ccff8Df37/c9ZmZmfjnn3+Qnp6Oy5cvY9y4cbC0tCyzhmrr1q1o2rQpOnfujH79+sHKygo//vijQRkPDw8AwM8//4z8/PwKYyuRk5ODf/75p9SDMWbU9qbUvXt3uLm5Ydu2bfyyHTt2QCaToW/fvuVu17FjR1y/fh3Z2dmmCJPUZ4wQQsqwYcMGBoBduHCh3DIDBw5kYrGYJSYm8svu37/P5HI56969O79s5syZzMLCgmVmZvLL1Go1UyqVbMyYMfyysWPHMmdnZ/bPP/8YHGfYsGFMoVCw/Pz8CmMGwACwixcv8svu3LnDLC0t2aBBg0qdW1JSEmOMsfT0dCYWi1nv3r2ZVqvly61cuZIBYOvXr+eX9e3bl3l4eFQYR4mioiLGcRz7+OOPS62bPXs2H++TD6VSyQ4dOlSqvEajYXZ2duzzzz/nl4WFhbF27dqVKjtq1CgGgDVq1IgNGjSILV68mMXFxZUqd/z48TJjKHmkpaWVe24l25a8h+UBwCZOnFhhmcDAQNa6desKy5S8XxkZGeyTTz5hPj4+/LrOnTuzt99+u8Ljbdu2jQFg586dq/A4hDwL1TgRQqpEq9Xi8OHDGDhwILy9vfnlzs7OCAsLw+nTp/n/7ocOHYqioiKDDryHDx9GVlYWhg4dCkDff2fXrl3o168fGGMGNR/BwcFQqVSIjY19ZlwBAQHo2LEj/9rd3R0DBgzAb7/9Bq1WW+Y2R48ehUajwZQpUyAQ/O/P4rhx42BjY4MDBw5U7s35V2ZmJhhjaNSoUblldu3ahSNHjuDw4cPYsGEDmjVrhsGDB+OPP/4wKHfw4EE8evQIw4cP55cNHz4cV69exV9//WVQdsOGDVi5ciW8vLywZ88efPLJJ2jZsiWCgoJw7969UjFERETgyJEjpR62trZ8GZVKZXBNVCoVAODx48cGy3Nzc6v0XlVGWFgYEhIScOHCBf5nec10JUquwT///FPj8ZH6jTqHE0KqJCMjA/n5+WjevHmpdS1btuTvEmvdujXatWuHFi1aYMeOHRg7diwAffOKvb09evbsye8vKysL33//falOzSXS09OfGZevr2+pZc2aNUN+fj4yMjL4PkRPunPnDgCUOhexWAxvb29+fVWxCpq8unfvbtA5/I033oCvry8+/PBDXLp0iV++ZcsWeHl5QSKRICEhAQDQtGlTWFlZYevWrZg/fz5fViAQYOLEiZg4cSIePXqEmJgYfPfddzh48CCGDRuGU6dOGcTQtm1b9OrVq8JzGDBgAE6cOFFq+dPNkOHh4di4cWOF+3peHTp0QIsWLbBt2zYolUo4OTnxn6PylFwDjuNqNDZS/1HiRAgxiaFDh2LevHn4559/IJfL8csvv2D48OF8J2idTgcAGDlyJMLDw8vch5+fn8nirQ62trbgOA6PHz82ehuZTIauXbti3759yMvLg7W1NbKzs/Hrr7+isLCwzMRw27ZtmDdvXplJgZ2dHfr374/+/fujR48eOHHiBO7cucP3hTLWkiVLDM7j6tWr+OSTT7BlyxY0btyYX+7i4lKp/VZVWFgYVq1aBblcjqFDhxrUFJalJPYnk1RCqoISJ0JIlTg4OMDKygrx8fGl1v39998QCARo0qQJv2zo0KGIjIzErl270LhxY2RnZxsMCOng4AC5XA6tVvvM2o+K3Lp1q9SymzdvwsrKCg4ODmVuU5JExMfHGzQ7ajQaJCUlGcRTmRoLkUiEpk2bIikpyehtAKC4uBiAfsRxa2tr7N69G4WFhVi1alWpL/74+Hj83//9H2JiYtCtW7cK99upUyecOHECaWlplU6cnmz+BP53199LL71k0uEISoSFhSEiIgJpaWn44Ycfnlk+KSkJAoEAzZo1M0F0pD6jxIkQUiVCoRC9e/fGvn37kJyczH95Pnz4ENu2bUO3bt1gY2PDl2/ZsiXatm2LHTt2oHHjxnB2dkb37t0N9jd48GB+gMmnR5LOyMgoN/F50pkzZxAbG8s3Id29exf79u1DSEhImQNQAvpxfsRiMVasWIGQkBA+OVq3bh1UKpXB3VrW1tZ8/x5jBAQEIDo62ujymZmZ+OOPP+Dk5MQPHbBlyxZ4e3vjvffeK1VerVZj4cKF2Lp1K7p164YHDx4gMzMTrVq1Miin0Whw7NgxCAQC+Pj4GB1PbdW0aVMsW7YMBQUF6NKlyzPLX7p0Ca1bt4ZCoTBBdKQ+o8SJEFKh9evX49ChQ6WWT548GV988QWOHDmCbt264f3334dIJMLq1auhVquxaNGiUtsMHToUERERsLS0xNixY0s1ryxcuBDHjx9H165dMW7cOLRq1QqZmZmIjY3F0aNHkZmZ+cx427Rpg+DgYEyaNAkSiQTffvstACAyMrLcbRwcHDBz5kxERkYiJCQE/fv3R3x8PL799lt07twZI0eO5Mt27NgRO3bswNSpU9G5c2fIZDL069ev3H0PGDAAP/zwA27evFlmbcfOnTshk8nAGMP9+/exbt06PH78GN999x04jsP9+/dx/PhxTJo0qcz9SyQSBAcH4+eff8aKFSuQmpqKLl26oGfPnggKCoKTkxPS09Px448/4urVq5gyZUqpWqtTp06hsLCw1L79/PyqpXn04sWL+OKLL0ot79GjB19LlpGRUWYZLy8vjBgxosz9Tp482ajjFxUV4cSJE3j//fcrETUh5TDnLX2EkNqr5Jb98h53795ljDEWGxvLgoODmUwmY1ZWVuyVV15hf/zxR5n7vHXrFr/96dOnyyzz8OFDNnHiRNakSRNmYWHBnJycWFBQEPv++++fGTP+vRV9y5YtzNfXl0kkEtahQwd2/PjxMs/t6VvpV65cyVq0aMEsLCxY48aN2YQJE9jjx48NyuTm5rKwsDCmVCoZgGcOTaBWq5m9vT2LiooyWF7WcATW1tYsICCA/fTTT3y5JUuWMADs2LFj5R5j48aNDADbt28fy87OZsuXL2fBwcHMzc2NWVhYMLlczgICAtiaNWuYTqfjt3vWcASzZ88u95iVGY6gvEfJexIYGFhumaCgIIP3KyMj45nHe3o4goMHDzIA7NatWxVuS4gxOMZq4QhnhBBSBRzHYeLEiVi5cqW5QzEQFRWFDRs24NatW+U2F5KaM3DgQHAchz179pg7FFIP0DhOhBBSwz766CPk5uZi+/bt5g6lwYmLi8P+/fsRFRVl7lBIPUF9nAghpIbJZDKjxqAi1a9ly5b8XYqEVAeqcSKEEEIIMRLVOBFC6g3qskkIqWlU40QIIYQQYiRKnAghhBBCjERNdYSn0+lw//59yOVymgiTEEJIvcUYQ05ODlxcXJ45z+HTKHEivPv37xvMLUYIIYTUZ3fv3oWbm1ultqHEifDkcjkA/QfpyTnGCCHVK19TjC7zjgEAzn8eBCsx/SkmxJSys7PRpEkT/nuvMui3lfBKmudsbGwocSKkBok0xRBIrADof98ocSLEPKrSLYU6hxNCCCGEGKlBJk49evTAlClTzB0GIYQQQuqYBlk/vHv3blhYWJg7DFKX6LRA6kUgLwOwdgDcOgECmqyVVI1EJMSP417gnxNSl+h0DMmP8pBTWAy5pQiedtYQCBrOndgNMnGytbU1dwjVhjEGrVYLkahBXkrTuHkYODYXeJwEMC3ACYFGXkBQBNCst7mjI3WQUMAhoKmducMgpNKu31NhV2wqEtJzoS7SQWIhgI+jDIP93dDGVWHu8EyiwTfVffvtt/D19YWlpSUaN26MN954w6h96HQ6LFiwAF5eXpBKpWjXrh127tzJr4+OjgbHcfjtt9/QoUMHSKVS9OzZE+np6Th48CBatmwJGxsbhIWFIT8/v9L7PXjwIDp27AiJRILTp08jJycHI0aMgLW1NZydnbF06VJqkqwONw8Du8cBmQmAUAKI5fqfmYn65TcPmztCQggxiev3VFhx7BaupaqglIrhaW8NpVSMa6n65dfvqcwdokk06GqKixcvYtKkSfjhhx/w4osvIjMzE6dOnTJq2wULFmDLli347rvv4Ovri5MnT2LkyJFwcHBAYGAgX27OnDlYuXIlrKysMGTIEAwZMgQSiQTbtm1Dbm4uBg0ahK+//hrTp0+v1H5nzJiBxYsXw9vbG40aNcLUqVMRExODX375BY0bN0ZERARiY2PRvn37an3PGhSdVl/TpFUDYhug5O4LoQAQiABNDvB7FOATRM12pFKKtDr8eD4FADC8izsshA3yf1hSh+h0DLtiU5GZp4GPo4y/G01mKYKPRIaE9Fzsjr2HVs429b7ZrkEnTikpKbC2tsbrr78OuVwODw8PdOjQ4ZnbqdVqzJ8/H0ePHkVAQAAAwNvbG6dPn8bq1asNEpwvvvgCL730EgBg7NixmDlzJhITE+Ht7Q0AeOONN3D8+HFMnz69UvudO3cuXn31VQBATk4ONm3ahG3btiEoKAgAsGHDBri4uDzzPNRqNf86Ozv7mefeoKRe1DfPiaz+lzSV4DhAJAUyb+vLuXc1T4ykTirS6hCx7y8AwBsd3ShxIrVe8qM8JKTnwlkhLXULP8dxcFZIcSs9B8mP8uDtIDNTlKbRoBOnV199FR4eHvD29kZISAhCQkIwaNAgWFlZVbhdQkIC8vPz+cSlhEajKZV4+fn58c8bN24MKysrPmkqWXb+/PlK77dTp07889u3b6OoqAhdunThlykUCjRv3rzC81iwYAEiIyMrLNOg5WXo+zSVV5skEALFOn05Qgipx3IKi6Eu0kGqKPvvoVQsxMNsHXIKi00cmek16MRJLpcjNjYW0dHROHz4MCIiIjBnzhxcuHABSqWy3O1yc3MBAAcOHICrq6vBOolEYvD6ybv3OI4rdTcfx3HQ6XSV3q+1tbURZ1ixmTNnYurUqfzrkpFUyb+sHfQdwXVaffPc03RagBPoyxFCSD0mtxRBYiFAgUYLmWXp1KFAo4XEQgB5Gevqm/p/hs8gEonQq1cv9OrVC7Nnz4ZSqcTvv/+O0NDQcrdp1aoVJBIJUlJSDJrPnldV9+vt7Q0LCwtcuHAB7u7uAACVSoWbN2+ie/fu5W4nkUhKJWTkCW6d9HfPZSbq+zQ9WT3NGFBcANj56MsRQkg95mlnDR9HGa6lquAjkRk01zHGkKYqgJ+bEp52z/9PfW3XoBOn/fv34/bt2+jevTsaNWqE//73v9DpdM9s4pLL5fjkk0/w0UcfQafToVu3blCpVIiJiYGNjQ3Cw8OrFE9V9yuXyxEeHo5p06bB1tYWjo6OmD17NgQCQZWGkyf/Egj1Qw7sHqfvCC6S6pfptPqkSSgGes6ijuGEkHpPIOAw2N8N9x4X8H2dpGIhCjRapKkKYGstRqi/a73vGA408MRJqVRi9+7dmDNnDgoLC+Hr64sff/wRrVu3fua2UVFRcHBwwIIFC3D79m0olUr4+/vjs88+e66Yqrrfr776Cu+99x5ef/112NjY4NNPP8Xdu3dhaWn5XPE0eM16A6Fr/jeOU7FO3zxn56NPmmgcJ0JIA9HGVYFJQb78OE4Ps/XjOPm5KRHq79pgxnHiGGPM3EGQ6peXlwdXV1csWbIEY8eONWqb7OxsKBQKqFQqmuT3aTRyOKlG+ZpitIr4DQBwY24wTfJL6pT6MHL483zf0W9rPXH58mX8/fff6NKlC1QqFebOnQsAGDBggJkjqycEQhpygFQbsVCA9aM78c8JqUsEAq7eDzlQEUqcypCSkoJWrVqVu/7GjRt8J+zaZPHixYiPj4dYLEbHjh1x6tQp2NvbmzssQshTREIBerZobO4wCCFVQE11ZSguLkZycnK56z09Pevl3HDUVEcIIaQhoKa6aiYSieDj42PuMAgh9VSRVoe9l+8BAAZ2cKWRwwmpQyhxIoQQEyvS6jBt558AgL5+zpQ4EVKH0G8rIYQQQoiRKHEihBBCCDESJU6EEEIIIUaixIkQQgghxEiUOBFCCCGEGIkSJ0IIIYQQI9W7xIkxhvHjx8PW1hYcx+HKlSvllu3RowemTJnCv/b09MSyZctqPEZCSMMmFgrwTZg/vgnzpylXCKlj6t04TocOHcLGjRsRHR0Nb2/vSk05cuHCBVhbW9dgdKTOokl+STUSCQXo6+ds7jAIqRNq26TC9S5xSkxMhLOzM1588cVKb+vg4FADEf0PYwxarbbap2vRaDQQi8XVuk/yhJuHgWNzgcdJANMCnBBo5AUERQDNeps7OkIIqbeu31NhV2wqEtJzoS7SQWIhgI+jDIP93dDGVWGWmOpVHfHo0aPx4YcfIiUlBRzHwdPTs1LbP9lUFxYWhqFDhxqsLyoqgr29PTZv3gwA0Ol0WLBgAby8vCCVStGuXTvs3LmTLx8dHQ2O43Dw4EF07NgREokEp0+frjCGOXPmoH379li9ejWaNGkCKysrDBkyBCqVyuA8Bw4ciHnz5sHFxQXNmzcHANy9exdDhgyBUqmEra0tBgwYUOGce8QINw8Du8cBmQmAUAKI5fqfmYn65TcPmztCUgcVa3U48GcaDvyZhmKtztzhEFIrXb+nwopjt3AtVQWlVAxPe2sopWJcS9Uvv35P9eyd1IB6lTgtX74cc+fOhZubG9LS0nDhwoUq72vEiBH49ddfkZubyy/77bffkJ+fj0GDBgEAFixYgM2bN+O7777DX3/9hY8++ggjR47EiRMnDPY1Y8YMLFy4EHFxcfDz83vmsRMSEvDTTz/h119/xaFDh3D58mW8//77BmWOHTuG+Ph4HDlyBPv370dRURGCg4Mhl8tx6tQpxMTEQCaTISQkBBqNpsrvQ4Om0+prmrRqQGwDCC0ATqD/KZYDWg3we5S+HCGVoNHqMHFbLCZui4WGEidCStHpGHbFpiIzTwMfRxlkliIIBRxkliL4OMqQmafB7th70OmYyWOrV011CoUCcrkcQqEQTk5Oz7Wv4OBgWFtbY8+ePXjrrbcAANu2bUP//v0hl8uhVqsxf/58HD16FAEBAQAAb29vnD59GqtXr0ZgYCC/r7lz5+LVV181+tiFhYXYvHkzXF1dAQBff/01+vbtiyVLlvDnZW1tjbVr1/JNdFu2bIFOp8PatWvBcfq23w0bNkCpVCI6Ohq9e5duUlKr1VCr1fzr7OzsyrxF9V/qRX3znMgK4J5qT+c4QCQFMm/ry7l3NU+MhBBSDyU/ykNCei6cFVL+O60Ex3FwVkhxKz0HyY/y4O0gM2ls9arGqTqJRCIMGTIEW7duBQDk5eVh3759GDFiBAB9rVB+fj5effVVyGQy/rF582YkJiYa7KtTp06VOra7uzufNAFAQEAAdDod4uPj+WVt27Y16Nd09epVJCQkQC6X87HY2tqisLCwVDwlFixYAIVCwT+aNGlSqTjrvbwMfZ+m8jqBC4QA0+nLEUIIqTY5hcVQF+kgFZf991cqFkJdpENOYbGJI6tnNU7VbcSIEQgMDER6ejqOHDkCqVSKkJAQAOCb8A4cOGCQ5ACARCIxeF0Td+o9vc/c3Fx07NiRT/SeVF6n95kzZ2Lq1Kn86+zsbEqenmTtoO8IrtMCZd0yrtPqm+6sa/amAkIIaWjkliJILAQo0GghsyydqhRotJBYCCAvY11No8SpAi+++CKaNGmCHTt24ODBg3jzzTdhYWEBAGjVqhUkEglSUlIMmuWqQ0pKCu7fvw8XFxcAwNmzZyEQCPhO4GXx9/fHjh074OjoCBsbG6OOI5FISiV55AlunfR3z2UmAgKRYXMdY0BxAWDnoy9HCCGk2njaWcPHUYZrqSr4SGQGzXWMMaSpCuDnpoSnnemHEKKmumcICwvDd999hyNHjvDNdAAgl8vxySef4KOPPsKmTZuQmJiI2NhYfP3119i0adNzHdPS0hLh4eG4evUqTp06hUmTJmHIkCEV9tsaMWIE7O3tMWDAAJw6dQpJSUmIjo7GpEmTkJqa+lzxNFgCoX7IAaEY0OQA2iJ905y2SP9aKAZ6zqLxnAghpJoJBBwG+7vB1lqMhPRc5BYWQ6tjyC0sRkJ6LmytxQj1dzXLeE6UOD3DiBEjcOPGDbi6uuKll14yWBcVFYVZs2ZhwYIFaNmyJUJCQnDgwAF4eXk91zF9fHwQGhqK1157Db1794afnx++/fbbCrexsrLCyZMn4e7ujtDQULRs2RJjx45FYWGh0TVQpAzNegOhawDbpvq76zS5+p92PvrlNI4TIYTUiDauCkwK8kVbNwWyCjRI/icPWQUa+LkpMSnI12zjOHGMMdPfy0fKNWfOHOzdu7fCqWJqSnZ2NhQKBVQqFSVbT6ORw0k1KtLqsPfyPQDAwA6usKBpVwgpV02MHP4833fUx4kQYwiENOQAqTYWQgHe7EQ3YhBiDIGAM/mQAxWpt4lTSkoKWrVqVe76GzduwN3d3YQR6bVu3Rp37twpc93q1atNHA0hhBBCKqPeNtUVFxdXON2Ip6dntc8ZZ4w7d+6gqKiozHWNGzeGXC43cUT/Q011hJhGsVaHk7f0439193WAiJrqCDEpaqorg0gkgo+Pj7nDKMXDw8PcIRBCzEyj1WHMxosAgBtzgylxIqQOod9WQgghhBAjUeJECCGEEGIkSpwIIYQQQoxEiRMhhBBCiJEocSKEEEIIMRIlToQQQgghRqq3wxEQQkhtZSEUYO6A1vxzQkjdQYkTIYSYmIVQgFEBnuYOgxBSBQ3iXx3GGMaPHw9bW1twHFflCXSTk5OrtD3Hcdi7d2+VjklqgE4LpJwD4vbrf+q05o6IEFLP6XQMtzNycfVuFm5n5EKnq5eTdjQIDaLG6dChQ9i4cSOio6Ph7e0Ne3t7c4dEzOXmYeDYXOBxEsC0ACcEGnkBQRFAs97mjo40EFodw/mkTABAFy9bCJ9zpndSu12/p8Ku2FQkpOdCXaSDxEIAH0cZBvu7oY2rwtzhkUpqEDVOiYmJcHZ2xosvvggnJyezzFFXUxhjKC4uNncYdcPNw8DucUBmAiCUAGK5/mdmon75zcPmjpA0EOpiLYavOYvha85CXUw1nvXZ9XsqrDh2C9dSVVBKxfC0t4ZSKsa1VP3y6/dU5g6RVFK9T5xGjx6NDz/8ECkpKeA4Dp6enhWW1+l0WLRoEXx8fCCRSODu7o558+aVWVar1WLMmDFo0aIFUlJSAAC3bt1C9+7dYWlpiVatWuHIkSNGx1rSFLh9+3a8+OKLsLS0RJs2bXDixAm+THR0NDiOw8GDB9GxY0dIJBKcPn0aOp0OCxYsgJeXF6RSKdq1a4edO3cafex6T6fV1zRp1YDYBhBaAJxA/1MsB7Qa4PcoarYjhFQbnY5hV2wqMvM08HGUQWYpglDAQWYpgo+jDJl5GuyOvUfNdnVM/al6Kcfy5cvRtGlTfP/997hw4QKEQmGF5WfOnIk1a9Zg6dKl6NatG9LS0vD333+XKqdWqzF8+HAkJyfj1KlTcHBwgE6nQ2hoKBo3boxz585BpVJhypQplY552rRpWLZsGVq1aoWvvvoK/fr1Q1JSEuzs7PgyM2bMwOLFi+Ht7Y1GjRphwYIF2LJlC7777jv4+vri5MmTGDlyJBwcHBAYGFjmcdRqNdRqNf86Ozu70rHWGakX9c1zIiuAe6pZhOMAkRTIvK0v597VPDESQuqV5Ed5SEjPhbNCCu6pvzscx8FZIcWt9BwkP8qDt4PMTFGSyqr3iZNCoYBcLodQKISTk1OFZXNycrB8+XKsXLkS4eHhAICmTZuiW7duBuVyc3PRt29fqNVqHD9+HAqFvo366NGj+Pvvv/Hbb7/BxcUFADB//nz06dOnUjF/8MEHGDx4MABg1apVOHToENatW4dPP/2ULzN37ly8+uqrAPQJ0Pz583H06FEEBAQAALy9vXH69GmsXr263MRpwYIFiIyMrFRsdVZehr5Pk6CcxFkgBIp1+nKEEFINcgqLoS7SQaoo+++OVCzEw2wdcgqpu0VdUu8Tp8qIi4uDWq1GUFBQheWGDx8ONzc3/P7775BKpQbbN2nShE+aAPCJTGU8uY1IJEKnTp0QFxdnUKZTp07884SEBOTn5/OJVAmNRoMOHTqUe5yZM2di6tSp/Ovs7Gw0adKk0vHWCdYO+o7gOi1Q1rg5Oq2+6c7awfSxEULqJbmlCBILAQo0WsgsS3/dFmi0kFgIIC9jHam96Go94ckkqCKvvfYatmzZgjNnzqBnz541HFXZrK2t+ee5ubkAgAMHDsDV1dWgnEQiKXcfEomkwvX1ilsn/d1zmYmAQGTYXMcYUFwA2PnoyxFCSDXwtLOGj6MM11JV8JHIDJrrGGNIUxXAz00JTzvrCvZCapt63zm8Mnx9fSGVSnHs2LEKy02YMAELFy5E//79DTput2zZEnfv3kVaWhq/7OzZs5WO48ltiouLcenSJbRs2bLc8q1atYJEIkFKSgp8fHwMHvW2BqmyBEL9kANCMaDJAbRFANPpf2py9Mt7ziq/KY8QQipJIOAw2N8NttZiJKTnIrewGFodQ25hMRLSc2FrLUaovysENBxFnUI1Tk+wtLTE9OnT8emnn0IsFuOll15CRkYG/vrrL4wdO9ag7IcffgitVovXX38dBw8eRLdu3dCrVy80a9YM4eHh+PLLL5GdnY3PP/+80nF888038PX1RcuWLbF06VI8fvwYY8aMKbe8XC7HJ598go8++gg6nQ7dunWDSqVCTEwMbGxs+P5aDV6z3kDomv+N41Ss0zfP2fnokyYax4mYiEggwMw+LfjnpP5q46rApCBffhynh9n6cZz83JQI9XelcZzqIEqcnjJr1iyIRCJERETg/v37cHZ2xnvvvVdm2SlTpkCn0+G1117DoUOH8OKLL2LPnj0YO3YsunTpAk9PT6xYsQIhISGVimHhwoVYuHAhrly5Ah8fH/zyyy/PHLQzKioKDg4OWLBgAW7fvg2lUgl/f3989tlnlTp2vdesN+ATpL97Li9D36fJrRPVNBGTEosEeDewqbnDICbSxlWBVs42SH6Uh5zCYsgtRfC0s6aapjqKY4zRABK1RHJyMry8vHD58mW0b9/e5MfPzs6GQqGASqWCjY2NyY9PCCGEmMLzfN9RjRMhhJiYVsf4EaPbuCpoyhVC6pAG1biekpICmUxW7qNk9O+aMn/+/HKPXdmxngghdZe6WIsB38RgwDcxNOUKIXVMg6pxcnFxwZUrVypcX5Pee+89DBkypMx1UqkUrq6uoJZTQgghpPZqUImTSCSCj4+P2Y5va2sLW1tbsx2fEEIIIc+nQTXVEUIIIYQ8D0qcCCGEEEKMRIkTIYQQQoiRKHEihBBCCDFSg+ocTgghtYFIIMDkIF/+OSGk7qDEiRBCTEwsEuCjV5uZOwxCSBXQvzqEEEIIIUaiGidS/+m00N29gPQHqcgRKiFs0hmeDjY0wSYxG52OISEjFwDg4yCjzyIhdQglTqR+u3kYBb/NhuBxMhoxLWwgQIbIBT96TEC7V4agjavC3BGSBqiwWIveS08CAG7MDYaVmP4UE1JX0G8rqb9uHkbxzncgKCpEISQAZwkhp4VT8T30T5yDDbkaoN9ISp4IIYQYjfo41SKHDh1Ct27doFQqYWdnh9dffx2JiYn8+j/++APt27eHpaUlOnXqhL1794LjOIP5965fv44+ffpAJpOhcePGeOutt/DPP/+Y4WzMTKcFOzYXuiI18mAFTmgBTsBBx4mgFlhBgmK8/s867LmUAp2O5gckhBBiHEqcapG8vDxMnToVFy9exLFjxyAQCDBo0CDodDpkZ2ejX79+aNu2LWJjYxEVFYXp06cbbJ+VlYWePXuiQ4cOuHjxIg4dOoSHDx+WO7GwWq1Gdna2waPeSL0IlpmEQoghfPp2b46DRiCBiy4NLPUCkh/lmSdGQgghdQ411dUigwcPNni9fv16ODg44MaNGzh9+jQ4jsOaNWtgaWmJVq1a4d69exg3bhxffuXKlejQoQPmz59vsI8mTZrg5s2baNbM8PbnBQsWIDIysmZPylzyMsCYFsWwgKiMfrc6CCFgakg1j5FTWGz6+AghhNRJVONUi9y6dQvDhw+Ht7c3bGxs4OnpCQBISUlBfHw8/Pz8YGlpyZfv0qWLwfZXr17F8ePHIZPJ+EeLFi0AwKDJr8TMmTOhUqn4x927d2vu5EzN2gEcJ4QIWrAyWuIE0ELHCVAgbgS5Jf3/QAghxDj0jVGL9OvXDx4eHlizZg1cXFyg0+nQpk0baDQao7bPzc1Fv3798J///KfUOmdn51LLJBIJJBLJc8ddK7l1AmfrBcv0W8jVCSESPvE/AmMQ69RIFbqCc+sMTztr88VJCCGkTqHEqZZ49OgR4uPjsWbNGrz88ssAgNOnT/Prmzdvji1btkCtVvPJzoULFwz24e/vj127dsHT0xMiUQO/tAIhuKAICHa+A+uiAhRqxQAngpDTwkKnhhoi7Lcfi0Ed3WkMHWJyIoEA47t7888JIXUH/cbWEo0aNYKdnR2+//57JCQk4Pfff8fUqVP59WFhYdDpdBg/fjzi4uLw22+/YfHixQAAjtN/8U+cOBGZmZkYPnw4Lly4gMTERPz22294++23odVqzXJeZtWsN0RvrIXO1huWXDEsWR4EOg3SRK74tWkketJQBMRMxCIBPnutJT57rSXEIvozTEhd0sCrJWoPgUCA7du3Y9KkSWjTpg2aN2+OFStWoEePHgAAGxsb/Prrr5gwYQLat2+Ptm3bIiIiAmFhYXy/JxcXF8TExGD69Ono3bs31Go1PDw8EBISAkFD/a+2WW9IfYJKjRw+jEYOJ4QQUgUcY2V1nSV1wdatW/H2229DpVJBKpU+9/6ys7OhUCigUqlgY2NTDRESQsqi0zHcyyoAALgqpZTEE2Jiz/N9RzVOdcjmzZvh7e0NV1dXXL16FdOnT8eQIUOqJWkihJhOYbEWLy86DoCmXCGkrqHf1jrkwYMHiIiIwIMHD+Ds7Iw333wT8+bNM3dYhBBCSINBiVMd8umnn+LTTz81dxiEEEJIg9VAewwTQgghhFQeJU6EEEIIIUaixIkQQgghxEiUOBFCCCGEGIk6hxNCiIkJBRzeesGDf04IqTsocSKEEBOTiISIGtjG3GEQQqqAmuoIIYQQQoxENU6EEGJijDFk5mkAALbWYn6ibkJI7Uc1Tv/q0aMHpkyZYrbjjx49GgMHDqw18dRqOi2Qcg6I26//qdOaOyJSB+h0DLczcnH1bhZuZ+RCpzPfNJ0FRVp0/OIoOn5xFAVF9PklpC6hGqdaavfu3bCwsDB3GLXPzcPAsbnA4ySAaQFOCDTyAoIigGa9zR0dqaWu31NhV2wqEtJzoS7SQWIhgI+jDIP93dDGVWHu8AghdQjVONVStra2kMvl5g6jdrl5GNg9DshMAIQSQCzX/8xM1C+/edjcEZJa6Po9FVYcu4VrqSoopWJ42ltDKRXjWqp++fV7KnOHSAipQyhxekJxcTE++OADKBQK2NvbY9asWWBMX53/ww8/oFOnTpDL5XByckJYWBjS09P5bR8/fowRI0bAwcEBUqkUvr6+2LBhA7/+7t27GDJkCJRKJWxtbTFgwAAkJyeXG8vTTXWenp6YP38+xowZA7lcDnd3d3z//fcG21T2GHWKTquvadKqAbENILQAOIH+p1gOaDXA71HUbEcM6HQMu2JTkZmngY+jDDJLEYQCDjJLEXwcZcjM02B37D2zNtsRQuoWSpyesGnTJohEIpw/fx7Lly/HV199hbVr1wIAioqKEBUVhatXr2Lv3r1ITk7G6NGj+W1nzZqFGzdu4ODBg4iLi8OqVatgb2/PbxscHAy5XI5Tp04hJiYGMpkMISEh0Gg0Rse3ZMkSdOrUCZcvX8b777+PCRMmID4+vsrHUKvVyM7ONnjUWqkX9c1zIivg6Y60HAeIpEDmbX05Qv6V/CgPCem5cFZIS3XA5jgOzgopbqXnIPlRnpkiJITUNdTH6QlNmjTB0qVLwXEcmjdvjmvXrmHp0qUYN24cxowZw5fz9vbGihUr0LlzZ+Tm5kImkyElJQUdOnRAp06dAOhriErs2LEDOp0Oa9eu5f94b9iwAUqlEtHR0ejd27i+Oa+99href/99AMD06dOxdOlSHD9+HM2bN6/SMRYsWIDIyMgqvVcml5eh79MkEJa9XiAEinX6coT8K6ewGOoiHaSKsj83UrEQD7N1yCksNnFkhJC6imqcnvDCCy8Y/FcaEBCAW7duQavV4tKlS+jXrx/c3d0hl8sRGBgIAEhJSQEATJgwAdu3b0f79u3x6aef4o8//uD3c/XqVSQkJEAul0Mmk0Emk8HW1haFhYVITEw0Oj4/Pz/+OcdxcHJy4psLq3KMmTNnQqVS8Y+7d+8a/2aZmrWDviN4eU1xOq2+6c7awbRxkVpNbimCxEKAAk3Zn5sCjRYSCwHklvQ/JCHEOPTXwgiFhYUIDg5GcHAwtm7dCgcHB6SkpCA4OJhvBuvTpw/u3LmD//73vzhy5AiCgoIwceJELF68GLm5uejYsSO2bt1aat8ODsZ/0T99lx3HcdDpdABQpWNIJBJIJBKjj29Wbp30d89lJgICkWFzHWNAcQFg56MvR8i/PO2s4eMow7VUFXwkMoN/jBhjSFMVwM9NCU87a5PGJRRwGOzvxj8nhNQdlDg94dy5cwavz549C19fX/z999949OgRFi5ciCZNmgAALl4s3ZfGwcEB4eHhCA8Px8svv4xp06Zh8eLF8Pf3x44dO+Do6AgbG5said0UxzArgVA/5MDucYAmR9+nSfBvDVRxASAUAz1nld+URxokwb8Jyr3HBXxfJ6lYiAKNFmmqAthaixHq7wqBiZMXiUiIJUPamfSYhJDqQU11T0hJScHUqVMRHx+PH3/8EV9//TUmT54Md3d3iMVifP3117h9+zZ++eUXREVFGWwbERGBffv2ISEhAX/99Rf279+Pli1bAgBGjBgBe3t7DBgwAKdOnUJSUhKio6MxadIkpKamVkvspjiG2TXrDYSuAWyb6u+u0+Tqf9r56JfTOE6kDG1cFZgU5Iu2bgpkFWiQ/E8esgo08HNTYlKQL43jRAipFKpxesKoUaNQUFCALl26QCgUYvLkyRg/fjw4jsPGjRvx2WefYcWKFfD398fixYvRv39/fluxWIyZM2ciOTkZUqkUL7/8MrZv3w4AsLKywsmTJzF9+nSEhoYiJycHrq6uCAoKqrbaIVMco1Zo1hvwCdLfPZeXoe/T5NaJappIhdq4KtDK2QbJj/KQU1gMuaUInnbWJq9pKsEY40cMl1oIacoVQuoQjpUMVEQavOzsbCgUCqhUqvqVbBFSy+RritEq4jcAwI25wbAS0/+whJjS83zfUVMdIYQQQoiRKHEihBBCCDESJU6EEEIIIUaixIkQQgghxEiUOBFCCCGEGIkSJ0IIIYQQI9E9sIQQYmICjsNrbZ3454SQuoMSJ0IIMTFLCyG+HdHR3GEQQqqAmuoIIYQQQoxEiRMhhBBCiJEocSKEEBPL1xTDc8YBeM44gHxNsbnDIYRUAvVxInWPTkuT/NZBOh2rNZPsEkJIVVHiVMeVzKp+5swZvPDCC/xytVoNFxcXZGZm4vjx4+jRo4eZIqxmNw8Dx+YCj5MApgU4IdDICwiKAJr1Nnd0pBzX76mwKzYVCem5UBfpILEQwMdRhsH+bmjjqjB3eIQQYjRqqqsHmjRpgg0bNhgs27NnD2QymZkiqiE3DwO7xwGZCYBQAojl+p+ZifrlNw+bO0JShuv3VFhx7BaupaqglIrhaW8NpVSMa6n65dfvqcwdIiGEGI0SJxPYuXMn2rZtC6lUCjs7O/Tq1Qt5eXkAgLVr16Jly5awtLREixYt8O233/LbjRkzBn5+flCr1QAAjUaDDh06YNSoUQb7Dw8Px/bt21FQUMAvW79+PcLDw01wdiai0+prmrRqQGwDCC0ATqD/KZYDWg3we5S+HKk1dDqGXbGpyMzTwMdRBpmlCEIBB5mlCD6OMmTmabA79h50OmbuUAkhxCiUONWwtLQ0DB8+HGPGjEFcXByio6MRGhoKxhi2bt2KiIgIzJs3D3FxcZg/fz5mzZqFTZs2AQBWrFiBvLw8zJgxAwDw+eefIysrCytXrjQ4RseOHeHp6Yldu3YBAFJSUnDy5Em89dZbFcamVquRnZ1t8Ki1Ui/qm+dEVsDTAwZyHCCSApm39eVIrZH8KA8J6blwVkj5ZuUSHMfBWSHFrfQcJD/KM1OEhBBSOdTHqYalpaWhuLgYoaGh8PDwAAC0bdsWADB79mwsWbIEoaGhAAAvLy/cuHEDq1evRnh4OGQyGbZs2YLAwEDI5XIsW7YMx48fh42NTanjjBkzBuvXr8fIkSOxceNGvPbaa3BwcKgwtgULFiAyMrKaz7iG5GXo+zSV1wlcIASKdfpypNbIKSyGukgHqaLs6yYVC/EwW4ecQrqzjBBSN1CNUw1r164dgoKC0LZtW7z55ptYs2YNHj9+jLy8PCQmJmLs2LGQyWT844svvkBiYiK/fUBAAD755BNERUXh448/Rrdu3co8zsiRI3HmzBncvn0bGzduxJgxY54Z28yZM6FSqfjH3bt3q+28q521g74jeHlNcTqtvunOuuJkkZiW3FIEiYUABZqyr1uBRguJhQByy4b1P5yA4/BKcwe80tyBplwhpI5pWH+tzEAoFOLIkSP4448/cPjwYXz99df4/PPP8euvvwIA1qxZg65du5bapoROp0NMTAyEQiESEhLKPY6dnR1ef/11jB07FoWFhejTpw9ycnIqjE0ikUAikTzH2ZmQWyf93XOZiYBAZNhcxxhQXADY+ejLkVrD084aPo4yXEtVwUciM2iuY4whTVUAPzclPO2szRil6VlaCLHh7S7mDoMQUgVU42QCHMfhpZdeQmRkJC5fvgyxWIyYmBi4uLjg9u3b8PHxMXh4eXnx23755Zf4+++/ceLECRw6dKjU3XNPGjNmDKKjozFq1CiD5KteEAj1Qw4IxYAmB9AWAUyn/6nJ0S/vOYvGc6plBAIOg/3dYGstRkJ6LnILi6HVMeQWFiMhPRe21mKE+rvSeE6EkDqDapxq2Llz53Ds2DH07t0bjo6OOHfuHDIyMtCyZUtERkZi0qRJUCgUCAkJgVqtxsWLF/H48WNMnToVly9fRkREBHbu3ImXXnoJX331FSZPnozAwEB4e3uXOlZISAgyMjLK7ANVLzTrDYSu+d84TsU6ffOcnY8+aaJxnGqlNq4KTAry5cdxepitH8fJz02JUH9XGseJEFKnUOJUw2xsbHDy5EksW7YM2dnZ8PDwwJIlS9CnTx8AgJWVFb788ktMmzYN1tbWaNu2LaZMmYLCwkKMHDkSo0ePRr9+/QAA48ePx4EDB/DWW2/h5MmTpWqVOI6Dvb29yc/RpJr1BnyCaOTwOqaNqwKtnG1o5PB/5WuK0THqKADg0qxesBLTn2JC6gqOMUYDqBAAQHZ2NhQKBVQqVf2ttSKkFsjXFKNVxG8AgBtzgylxIsTEnuf7jvo4EUIIIYQYiRInQgghhBAjUeJECCGEEGIkSpwIIYQQQoxEiRMhhBBCiJHoVg5CCDExAcehq5ct/5wQUndQ4kQIISZmaSHEjncDzB0GIaQKqKmOEEIIIcRIlDgRQgghhBiJEidCCDGxfE0x/KOOwD/qCPI1xeYOhxBSCdTHiRBCzCAzT2PuEAghVUA1Tk9hjGH8+PGwtbUFx3G4cuVKuWV79OiBKVOmVLi/Bw8e4NVXX4W1tTWUSmW1xkoIIYQQ06Iap6ccOnQIGzduRHR0NLy9vWFvb/9c+1u6dCnS0tJw5coVKBSKaoqyAdBpgdSLQF4GYO0AuHUCBEJzR0VqCZ2OIflRHnIKiyG3FMHTzhoCAd3WTwipeZQ4PSUxMRHOzs548cUXq21/HTt2hK+vb7XsryxFRUWwsLCosf2b3M3DwLG5wOMkgGkBTgg08gKCIoBmvc0dHTGz6/dU2BWbioT0XKiLdJBYCODjKMNgfze0caV/TgghNYua6p4wevRofPjhh0hJSQHHcfD09HzmNjqdDp9++ilsbW3h5OSEOXPm8Os8PT2xa9cubN68GRzHYfTo0c/cH8dxWLVqFfr06QOpVApvb2/s3LmTX5+cnAyO47Bjxw4EBgbC0tISW7duBQCsXbsWLVu2hKWlJVq0aIFvv/22sm+B+d08DOweB2QmAEIJIJbrf2Ym6pffPGzuCIkZXb+nwopjt3AtVQWlVAxPe2sopWJcS9Uvv35PZe4QCSH1HCVOT1i+fDnmzp0LNzc3pKWl4cKFC8/cZtOmTbC2tsa5c+ewaNEizJ07F0eOHAEAXLhwASEhIRgyZAjS0tKwfPlyo+KYNWsWBg8ejKtXr2LEiBEYNmwY4uLiDMrMmDEDkydPRlxcHIKDg7F161ZERERg3rx5iIuLw/z58zFr1ixs2rSp8m+Euei0+pomrRoQ2wBCC4AT6H+K5YBWA/wepS9HGhydjmFXbCoy8zTwcZRBZimCUMBBZimCj6MMmXka7I69B52OmTtUQkg9Rk11T1AoFJDL5RAKhXBycjJqGz8/P8yePRsA4Ovri5UrV+LYsWN49dVX4eDgAIlEAqlUavT+AODNN9/EO++8AwCIiorCkSNH8PXXXxvUIE2ZMgWhoaH869mzZ2PJkiX8Mi8vL9y4cQOrV69GeHh4mcdRq9VQq9X86+zsbKNjrBGpF/XNcyIr4OlpKDgOEEmBzNv6cu5dzRMjMZvkR3lISM+Fs0IK7qnPB8dxcFZIcSs9B8mP8uDtIDNTlMYRcBz83BT8c0JI3UGJ03Py8/MzeO3s7Iz09PTn2mdAQECp10/f3depUyf+eV5eHhITEzF27FiMGzeOX15cXFxhh/QFCxYgMjLyuWKtVnkZ+j5N5XUCFwiBYp2+HGlwcgqLoS7SQaoo+/MhFQvxMFuHnMLaPy6SpYUQv3zQzdxhEEKqgBKn5/R0p2yO46DT6Wr8uNbW1vzz3NxcAMCaNWvQtathTYxQWP6daDNnzsTUqVP519nZ2WjSpEk1R1oJ1g76juA6LSAsoxVZp9U33Vk7mD42YnZySxEkFgIUaLSQWZb+01Wg0UJiIYC8jHWk4dDpdNBoaIyshs7CwqLC77/nQX9haqGzZ89i1KhRBq87dOhQbvnGjRvDxcUFt2/fxogRI4w+jkQigUQiea5Yq5VbJ/3dc5mJgEBk2FzHGFBcANj56MuRBsfTzho+jjJcS1XBRyIzaK5jjCFNVQA/NyU87awr2AupzzQaDZKSkkzyzyup/ZRKJZycnEo17T8vSpxqoZ9//hmdOnVCt27dsHXrVpw/fx7r1q2rcJvIyEhMmjQJCoUCISEhUKvVuHjxIh4/fmxQq1SrCYT6IQd2jwM0Ofo+TYJ/a6CKCwChGOg5i8ZzaqAEAg6D/d1w73EB39dJKhaiQKNFmqoAttZihPq71onxnAo0WvT66gQA4OjUQEjF9Jl+XowxpKWlQSgUokmTJhAI6N6nhooxhvz8fL7bjLOzc7XunxKnWigyMhLbt2/H+++/D2dnZ/z4449o1apVhdu88847sLKywpdffolp06bB2toabdu2febI5rVOs95A6Jr/jeNUrNM3z9n56JMmGsepQWvjqsCkIF9+HKeH2fpxnPzclAj1d60z4zgxMNzLKuCfk+dXXFyM/Px8uLi4wMrKytzhEDOTSqUAgPT0dDg6OlZrsx3HGKPf2lqE4zjs2bMHAwcONPmxs7OzoVAooFKpYGNjY/LjG6CRw0kF6vrI4fmaYrSK+A0AcGNuMKzE9D/s8yosLERSUhI8PT35L03SsBUUFCA5ORleXl6wtLQ0WPc833f020pqJ4GQhhwg5RIIuFo/5AAxj+ruz0Lqrpr6LFAjcDlSUlIgk8nKfaSkpFR6n1u3bi13f61bt66BsyCEEEJIdaIap3K4uLiUGjvp6fWV1b9//1LDBZQoGdaAWk4JIYRU1pw5c7Bq1Sqkp6ebrbtHQ0GJUzlEIhF8fHyqdZ9yuRxyubxa90kIIaTuGj16tMHUWLa2tujcuTMWLVpUaoDl8sTFxSEyMhJ79uzBCy+8gEaNGtVUuATUVEcIISbHgYOvowy+jjJwoD45tYlOx3A7IxdX72bhdkauSeY+DAkJQVpaGtLS0nDs2DGIRCK8/vrrRm+fmJgIABgwYACcnJyqPD5fUVFRlbZraChxIoQQE5OKhTgyNRBHaAynWuX6PRWiDtzA7F/+wrwDcZj9y1+IOnAD1++pavS4EokETk5OcHJyQvv27TFjxgzcvXsXGRn66aXu3r2LIUOGQKlUwtbWFgMGDEBycjIAfRNdv379AAACgYDvEK3T6fhJ6yUSCdq3b49Dhw7xx0xOTgbHcdixYwcCAwNhaWmJrVu3AgDWrl2Lli1bwtLSEi1atDCYJ5VQ4kQIIYTg+j0VVhy7hWupKiilYnjaW0MpFeNaqn55TSdPJXJzc7Flyxb4+PjAzs4ORUVFCA4Ohlwux6lTpxATEwOZTIaQkBBoNBp88skn2LBhAwDwtVYAsHz5cixZsgSLFy/Gn3/+ieDgYPTv3x+3bt0yON6MGTMwefJkxMXFITg4GFu3bkVERATmzZuHuLg4zJ8/H7NmzTJoTmzoqI8TIYSQBk2nY9gVm4rMPA18HP83nY/MUgQfiQwJ6bnYHXsPrZxtamS8sP3790Mm0w+vkZeXB2dnZ+zfvx8CgQDbtm2DTqfD2rVr+bg2bNgApVKJ6Oho9O7dG0qlEgDg5OTE73Px4sWYPn06hg0bBgD4z3/+g+PHj2PZsmX45ptv+HJTpkxBaGgo/3r27NlYsmQJv8zLyws3btzA6tWrER4eXu3nXhdR4kQIISZWoNGi/8rTAIBfPuhGzXVmlvwoj5/G5+mxfziOg7NCilvpOUh+lFcj44e98sorWLVqFQDg8ePH+Pbbb9GnTx+cP38eV69eRUJCQqkbiwoLC/m+TU/Lzs7G/fv38dJLLxksf+mll3D16lWDZZ06/W/uz7y8PCQmJmLs2LEYN24cv7y4uBgKRd0Yld8UKHEihBATY2C4lZ7LPyfmlVNYDHWRDlJF2QmsVCzEw2wdcgqLa+T41tbWBndxr127FgqFAmvWrEFubi46duzI9z96koODQ7Ucu0Rurv4zuWbNmlJD51TnlCV1HSVOhBBCGjS5pQgSCwEKNFrILEt/LRZotJBYCCAvY11N4DgOAoEABQUF8Pf3x44dO+Do6Gj01CA2NjZwcXFBTEwMAgMD+eUxMTHo0qVLuds1btwYLi4uuH37NkaMGPHc51FfVapzOGMM48ePh62tLTiOq3CASFMZPXo0DfRFCCGkyjztrOHjKEOaqqDUIMSMMaSpCuDrKIennXU5e3g+arUaDx48wIMHDxAXF4cPP/wQubm56NevH0aMGAF7e3sMGDAAp06dQlJSEqKjozFp0iSkpqaWu89p06bhP//5D3bs2IH4+HjMmDEDV65cweTJkyuMJTIyEgsWLMCKFStw8+ZNXLt2DRs2bMBXX31V3addZ1UqfT506BA2btyI6OhoeHt7w97evqbiqhU8PT0xZcoUTJkyxdyhNCw0wW+9V9cn6SX1i0DAYbC/G+49LuD7OknFQhRotEhTFcDWWoxQf9ca+4weOnQIzs7OAPQDJbdo0QI///wzevToAQA4efIkpk+fjtDQUOTk5MDV1RVBQUEV1kBNmjQJKpUKH3/8MdLT09GqVSv88ssv8PX1rTCWd955B1ZWVvjyyy8xbdo0WFtbo23btvQ9+IRKJU6JiYlwdnbGiy++WFPxmIRGo4FYLDZ3GNWmqKiIn7Klzrt5GDg2F3icBDAtwAmBRl5AUATQrLe5oyPV4Po9FXbFpiIhPRfqIh0kFgL4OMow2N8NbVypAyoxjzauCkwK8uU/mw+z9Z9NPzclQv1da+yzuXHjRmzcuLHCMk5OThUOBzBw4MBSNWUCgQCzZ8/G7Nmzy9zG09Oz3Cm+wsLCEBYWVnHgDZjRTXWjR4/Ghx9+iJSUFHAcB09PzwrL9+jRA5MmTcKnn34KW1tbODk5Yc6cOQZlsrKy8M4778DBwQE2Njbo2bOnQY//OXPmoH379li9ejWaNGkCKysrDBkyBCpV6fE0Fi9eDGdnZ9jZ2WHixIkGI6B6enoiKioKo0aNgo2NDcaPHw8A2LVrF1q3bg2JRAJPT08sWbLEIP47d+7go48+AsdxBndaVLTd3Llz4eLigkePHvHL+vbti1deeQU6na7iNxn6tu1Vq1ahT58+kEql8Pb2xs6dO/n19XrQspuHgd3jgMwEQCgBxHL9z8xE/fKbh80dIXlOtWWsHELK0sZVgVl9WyGyf2t83rclIvu3xv/1bUkJPTFgdOK0fPlyfhTStLQ0XLhw4ZnbbNq0CdbW1jh37hwWLVqEuXPn4siRI/z6N998E+np6Th48CAuXboEf39/BAUFITMzky+TkJCAn376Cb/++isOHTqEy5cv4/333zc4zvHjx5GYmIjjx49j06ZNZWbwixcvRrt27XD58mXMmjULly5dwpAhQzBs2DBcu3YNc+bMwaxZs/jtdu/eDTc3N8ydO9dgULFnbff555/D09MT77zzDgDgm2++wR9//IFNmzZBIDDu7Z41axYGDx6Mq1evYsSIERg2bBji4uIMytS7Qct0Wn1Nk1YNiG0AoQXACfQ/xXJAqwF+j9KXI3XS02PlyCxFEAo4/Vg5jjJk5mmwO/aeSaa4MDcOHFyVUrgqpTTlSi0jEHDwdpChXRMlvB1k1IRMSmOVsHTpUubh4WFU2cDAQNatWzeDZZ07d2bTp09njDF26tQpZmNjwwoLCw3KNG3alK1evZoxxtjs2bOZUChkqamp/PqDBw8ygUDA0tLSGGOMhYeHMw8PD1ZcXMyXefPNN9nQoUP51x4eHmzgwIEGxwkLC2OvvvqqwbJp06axVq1aGWy3dOnSSm+XmJjI5HI5mz59OpNKpWzr1q1lvENlA8Dee+89g2Vdu3ZlEyZMYIwxlpSUxACwZcuWGZRp2rQp27Ztm8GyqKgoFhAQUO6xCgsLmUql4h93795lAJhKpTI63mpz5yxj81wYW+jF2JfNSj8WeunX3zlr+thItUhMz2Ej155lH2yNZTN2/Vnq8cHWWDZy7VmWmJ5j7lBJHVRQUMBu3LjBCgoKzB0KqSUq+kyoVKoqf9/V6JQrT8/s7OzsjPT0dADA1atXkZubCzs7O8hkMv6RlJRkMKiXu7s7XF1d+dcBAQHQ6XSIj4/nl7Vu3dpgjIknj1PiyUG+AP1s0mUNDnbr1i1oteXXahiznbe3NxYvXoz//Oc/6N+/f6XbigMCAkq9frrGqbxBy558L7/44otyB0gDgAULFkChUPCPJk2aVCrOapWXoe/TVF4ncIEQYDp9OVIn8WPllDPYo1QshLqo5sbKIYSQ6lCjg1I83WGZ4zi+n09ubi6cnZ0RHR1daruS4eOr4zglnhzkyxROnjwJoVCI5ORkFBcXQySq3re6OgYtmzlzJqZOncq/zs7ONl/yZO2g7wiu0wLCMvJ5nVbfdGf9/AO+EfOobWPlEEJIVZhtkl9/f388ePAAIpEIPj4+Bo8nhzlISUnB/fv3+ddnz56FQCBA8+bNn+v4LVu2RExMjMGymJgYNGvWjE82xGJxqdonY7bbsWMHdu/ejejoaKSkpCAqKqpSsZ09e7bU65YtW5Zb/slBy55+L728vMrdTiKRwMbGxuBhNm6d9HfPFRcAT9/pwZh+ua23vhypk8w9Vk5tUlikn3Kl/8rTKCyifnuE1CVm+9euV69eCAgIwMCBA7Fo0SI0a9YM9+/fx4EDBzBo0CC+KcrS0hLh4eFYvHgxsrOzMWnSJAwZMsRgMsOq+Pjjj9G5c2dERUVh6NChOHPmDFauXGlwJ5qnpydOnjyJYcOGQSKRwN7e/pnbpaamYsKECfjPf/6Dbt26YcOGDXj99dfRp08fvPDCC0bF9vPPP6NTp07o1q0btm7divPnz2PdunUVbhMZGYlJkyZBoVAgJCQEarUaFy9exOPHjw1qlWotgVA/5MDucYAmBxBJ9ct0Wn3SJBQDPWfReE51mLnHyqlNdIzhz1QV/5wQUneYrcaJ4zj897//Rffu3fH222+jWbNmGDZsGO7cuYPGjRvz5Xx8fBAaGorXXnsNvXv3hp+fX7XcZu/v74+ffvoJ27dvR5s2bRAREYG5c+di9OjRfJm5c+ciOTkZTZs25ecEqmg7xhhGjx6NLl264IMPPgAABAcHY8KECRg5ciTfpPYskZGR2L59O/z8/LB582b8+OOPaNWqVYXbvPPOO1i7di02bNiAtm3bIjAwEBs3bqywxqnWadYbCF0D2DbV312nydX/tPPRL6dxnOq8krFy2ropkFWgQfI/ecgq0MDPTYlJQb502zchpNbj2NN15rXInDlzsHfv3loxtYupcByHPXv2mGUamezsbCgUCqhUKvM229HI4fVeQx85PF9TjFYRvwEAbswNhpWY+nU9r8LCQiQlJcHLywuWlpbmDofUAhV9Jp7n+85sNU6ElEsgBNy7Ai1f1/+kpKneobFyCDEeM9M8sfHx8XByckJOTo5JjlcZw4YNMxh82pSqlDilpKQY3Pb+9CMlJaW646wXtm7dWu571rp1a3OHRwghxEzOnDkDoVCIvn37llpXMk/s/v37kZaWhjZt2oDjOOzdu7dGY5o5cyY+/PBDyOVyAEB0dDQ4jkNWVpbB65JH48aNMXjwYNy+fbvUurIe3333HTiOK3VD1AsvvABLS0sUFhbyywoLC2Fpacn39/2///s/zJs3r8yZRGpaleqHXVxcKsx4XVxcqhqPgTlz5pSapqUu69+/f6nhAkqUDKlQi1tOCSGk/jNTV4F169bhww8/xLp163D//n2D79GanCe2vLlOU1JSsH//fnz99dfP3Ed8fDzkcjlu3bqF8ePHo1+/foiNjeVn3ACAyZMnIzs7Gxs2bOCX2draIjIyEtHR0fzNUzk5OYiNjUXjxo1x9uxZfqLjM2fOQK1Wo2fPngCANm3aoGnTptiyZQsmTpz4PG9BpVUpcSoZQoBUjlwu5zN3QkjDZmtdfyYarzfMNMl4bm4uduzYgYsXL+LBgwfYuHEjPvvsMwD6eWJLps7iOA4eHh78doMGDQIAeHh4IDk5GQCwb98+REZG4saNG3BxcUF4eDg+//xzfixBjuPw7bff4uDBgzh27BimTZtWZgXFTz/9hHbt2hkMQF0eR0dHKJVKODs7IyIiAiNGjEBycrLBsEFSqRRqtbrUHfGvvPIKoqOjMWPGDADA6dOn0axZM3Tv3h3R0dF84hQdHQ0PDw+DG5769euH7du3mzxxoj5OhBBiYlZiEWJnvYrYWa9Sx/DawoyTjP/0009o0aIFmjdvjpEjR2L9+vV860NZ88SWzBW7YcMGg7ljT506hVGjRmHy5Mm4ceMGVq9ejY0bN2LevHkGx5szZw4GDRqEa9euYcyYMWXGdOrUqVIzbhhDKpUCADQajVHlX3nlFZw+fRrFxfoZA44fP44ePXogMDAQx48f58sdP34cr7zyisG2Xbp0wfnz56FWqysd5/OgxIkQQkjDZuZJxtetW4eRI0cCAEJCQqBSqXDixAkAgEKhgFwuh1AohJOTExwcHPjhcZRKJb8M0A9lM2PGDISHh8Pb2xuvvvoqoqKisHr1aoPjhYWF4e2334a3tzfc3d3LjOnOnTuV7naTlpaGxYsXw9XV1ehBql955RXk5eXxyV90dDQCAwPRvXt3nDt3DoWFhSgoKMD58+dLJU4uLi7QaDR48OBBpeJ8XvSvDiGEkIYt9aK+eU5kBXBP3eHJcfoBeTNv68u5l91Ptari4+Nx/vx57NmzB4C+K8zQoUOxbt06vpnKWFevXkVMTIxBDZNWq0VhYSHy8/NhZWUFoPTcrWUpKCgwelgHNzc3MMaQn5+Pdu3aYdeuXRCLjWuK9vHxgZubG6Kjo9G6dWtcvnwZgYGBcHR0hLu7O86cOQPGGNRqdanEqaR2Kz8/36hjVRdKnAghxMQKi7QIX38eALBpTBdYWtCQG2ZlzCTjxTUzyfi6detQXFxsULvDGINEIsHKlSuhUBg/KGxubi4iIyMRGhpaat2TSZAxc7fa29vj8ePHRh331KlTsLGxgaOjY5X68fbo0QPHjx+Hn58ffH194ejoCAB8cx1jDD4+PqXmUs3MzAQAvsbNVChxIoQQE9MxhnNJmfxzYmZmmmS8uLgYmzdvxpIlS9C7t2Hn84EDB+LHH3/Ee++9V+a2FhYWpeZS9ff3R3x8fLXcvNWhQwfcuHHDqLJeXl5QKpVVPtYrr7yCSZMmoVWrVga1bN27d8eaNWvAGCtV2wQA169fh5ubm8H8tqZAfZwIIYQ0bGaaZHz//v14/Pgxxo4dizZt2hg8Bg8eXOEcpZ6enjh27BgePHjA1wxFRERg8+bNiIyMxF9//YW4uDhs374d//d//1fp2IKDg3HmzJlSyVlNKOnntH79egQGBvLLAwMDce7cuTL7NwH6mq6nE05ToMSJEEJIw1YyybhQrJ9kXFsEMJ3+pyanxiYZX7duHXr16lVmc9zgwYNx8eJF/Pnnn2Vuu2TJEhw5cgRNmjRBhw4dAOiTnf379+Pw4cPo3LkzXnjhBSxdutRgCANj9enTByKRCEePHq30tpXl5eUFDw8P5OTkGCRO7u7ufAfwp/t7FRYWYu/evRg3blyNx/e0Wj1XHTGtWjNXHSH1HM1VV/2qZa46g3GcdPrmOVtvfdLUACcZ/+abb/DLL7/gt99+M3copaxatQp79uzB4cPlDxNRU3PVNbjfVsYY3n33XezcuROPHz/G5cuX0b59e6O379GjB9q3b49ly5bVWIz1Bk3WaxINfcJcQqpNs96ATxD93frXu+++i6ysLOTk5NS6wZstLCyMGtW8JjS4xKlkzp/o6Gh4e3ubvFNZg2GmEXgbmuv3VNgVm4qE9Fyoi3SQWAjg4yjDYH83tHE1/m4cQsi/SiYZJxCJRPj888/NHUaZ3nnnHbMdu8H1cXpyzh8nJyd+GPq6zNgRWk3GjCPwNiTX76mw4tgtXEtVQSkVw9PeGkqpGNdS9cuv3zP95JfEeFILIaQ0DAEhdU6DSpxGjx6NDz/8ECkpKeA4Dp6enhWWz8vLw6hRoyCTyeDs7IwlS5aUKuPp6YkvvviCL+fh4YFffvkFGRkZGDBgAGQyGfz8/HDx4kWjYty4cSOUSiX27t0LX19fWFpaIjg4GHfv3uXLzJkzB+3bt8fatWsN2m6zsrLwzjvvwMHBATY2NujZsyeuXr1q/BtUHcw8Am9DodMx7IpNRWaeBj6OMsgsRRAKOMgsRfBxlCEzT4Pdsfeg01EXxtrISixCXFQI4qJCqH8TIXVMg0qcyprzpyLTpk3DiRMnsG/fPhw+fBjR0dGIjY0tVW7p0qV46aWXcPnyZfTt2xdvvfUWRo0ahZEjRyI2NhZNmzbFqFGjYGw//Pz8fMybNw+bN29GTEwMsrKyMGzYMIMyCQkJ2LVrF3bv3o0rV64AAN58802kp6fj4MGDuHTpEvz9/REUFMQPEvY0tVqN7Oxsg8dzq8wIvKTKkh/lISE9F84KKbin3meO4+CskOJWeg6SH+WZKUJCCKmfGtS/Ok/P+VOR3NxcrFu3Dlu2bEFQUBAAYNOmTXBzcytV9rXXXsO7774LQD+OxqpVq9C5c2e8+eabAIDp06cjICAADx8+fOZxAaCoqAgrV65E165d+eO2bNkS58+fR5cuXQDom+c2b97Mj5h6+vRpnD9/Hunp6ZBIJACAxYsXY+/evdi5cyfGjx9f6jgLFixAZGTkM+OpFDOOwNuQ5BQWQ12kg1RR9vssFQvxMFuHnMJiE0dGiHnRjeKkhE6nq5H9NqjEqTISExOh0Wj45AUAbG1ty5y40M/Pj3/euHFjAEDbtm1LLUtPTzcqcRKJROjcuTP/ukWLFlAqlYiLi+MTJw8PD4Nh5q9evYrc3FzY2dkZ7KugoACJiYllHmfmzJmYOnUq/zo7O7vUkPaVZqYReBsauaUIEgsBCjRayCxL/xoXaLSQWAggL2MdMb/CIi0mbLkEAFg1siNNuVINLCwswHEcMjIy4ODgUKomljQcjDFoNBpkZGRAIBAYPW+eseivajWwsLDgn5f8spa1rDqz36fnGsrNzYWzszOio6NLlS1vKHyJRMLXTlWbkhF4MxMBgciwua5kBF47n2ofgbeh8bSzho+jDNdSVfCRyAy+JBhjSFMVwM9NCU+7Z89JRUxPxxiOx2fwz8nzEwqFcHNzQ2pqKpKTk80dDqkFrKys4O7uDoGgenslUeJUjqZNm8LCwgLnzp2Du7s7AODx48e4efOmwcimNaG4uBgXL17ka5fi4+ORlZWFli1blruNv78/Hjx4AJFI9MxO7zWqZATe3eP0I+6KpPplOq0+aaqhEXgbGoGAw2B/N9x7XMD3dZKKhSjQaJGmKoCttRih/q40nhNpUGQyGXx9fVFUVGTuUIiZCYVCiESiGql5pMSpHDKZDGPHjsW0adNgZ2cHR0dHfP7559WeuZbFwsICH374IVasWAGRSIQPPvgAL7zwAp9IlaVXr14ICAjAwIEDsWjRIjRr1gz379/HgQMHMGjQIHTqZMIanma9gdA1/xvHqfjfEXjtfBrsCLw1oY2rApOCfPlxnB5m68dx8nNTItTflcZxIg2SUCiEUEj/mJGaQ4lTBb788kvk5uaiX79+kMvl+Pjjj6FS1fzYOFZWVpg+fTrCwsJw7949vPzyyxVO9gjomwP/+9//4vPPP8fbb7+NjIwMODk5oXv37nwfK5OiEXhNoo2rAq2cbWjkcEIIMRGaq66W2bhxI6ZMmYKsrCyTH5vmqiPENGiuOkLM63m+7xrUOE6EEEIIIc+jwf6bk5KSglatWpW7/saNG3yn8OrUp08fnDp1qsx1n332GVxcXKr9mMYqqXysloEwCSHlytcUQ6fOB6D/fSumGidCTKrke64qjW4NtqmuuLi4wltWPT09a2Qeu3v37qGgoKDMdba2trC1ta32YxorNTX1+cdxIoQQQuqIu3fvljmwdUUabOJEStPpdLh//z7kcrlRt3CWDJh59+7detEnis6ndqPzqf3q2znR+dRuz3M+jDHk5OTAxcWl0nfLU/0w4QkEgkpn3gBgY2NTL34JS9D51G50PrVffTsnOp/ararno1BUbcgW6hxOCCGEEGIkSpwIIYQQQoxEiROpMolEgtmzZ1f/fHdmQudTu9H51H717ZzofGo3c50PdQ4nhBBCCDES1TgRQgghhBiJEidCCCGEECNR4kQIIYQQYiRKnAghhBBCjESJUwP2zTffwNPTE5aWlujatSvOnz9fYfmff/4ZLVq0gKWlJdq2bYv//ve/BusZY4iIiICzszOkUil69eqFW7duGZTJzMzEiBEjYGNjA6VSibFjxyI3N7fWnU9RURGmT5+Otm3bwtraGi4uLhg1ahTu379vsA9PT09wHGfwWLhwYa07HwAYPXp0qVhDQkIMytSV6wOg1LmUPL788ku+TG25Pn/99RcGDx7Mx7Ns2bIq7bOwsBATJ06EnZ0dZDIZBg8ejIcPH1bL+dTEOS1YsACdO3eGXC6Ho6MjBg4ciPj4eIMyPXr0KHWN3nvvvVp5PnPmzCkVa4sWLQzK1OQ1qu7zKev3g+M4TJw4kS9TW67PmjVr8PLLL6NRo0Zo1KgRevXqVaq8yb6DGGmQtm/fzsRiMVu/fj3766+/2Lhx45hSqWQPHz4ss3xMTAwTCoVs0aJF7MaNG+z//u//mIWFBbt27RpfZuHChUyhULC9e/eyq1evsv79+zMvLy9WUFDAlwkJCWHt2rVjZ8+eZadOnWI+Pj5s+PDhte58srKyWK9evdiOHTvY33//zc6cOcO6dOnCOnbsaLAfDw8PNnfuXJaWlsY/cnNza935MMZYeHg4CwkJMYg1MzPTYD915fowxgzOIy0tja1fv55xHMcSExP5MrXl+pw/f5598skn7Mcff2ROTk5s6dKlVdrne++9x5o0acKOHTvGLl68yF544QX24osvPvf51NQ5BQcHsw0bNrDr16+zK1eusNdee425u7sbXIPAwEA2btw4g2ukUqlq5fnMnj2btW7d2iDWjIwMgzI1dY1q4nzS09MNzuXIkSMMADt+/DhfprZcn7CwMPbNN9+wy5cvs7i4ODZ69GimUChYamoqX8ZU30GUODVQXbp0YRMnTuRfa7Va5uLiwhYsWFBm+SFDhrC+ffsaLOvatSt79913GWOM6XQ65uTkxL788kt+fVZWFpNIJOzHH39kjDF248YNBoBduHCBL3Pw4EHGcRy7d+9erTqfspw/f54BYHfu3OGXeXh4lPkH6XnVxPmEh4ezAQMGlHvMun59BgwYwHr27GmwrLZcH2NietY+s7KymIWFBfv555/5MnFxcQwAO3PmzHOcjXHHr4ix73N6ejoDwE6cOMEvCwwMZJMnT65KyBWqifOZPXs2a9euXbnb1eQ1MsX1mTx5MmvatCnT6XT8stp4fRhjrLi4mMnlcrZp0ybGmGm/g6iprgHSaDS4dOkSevXqxS8TCATo1asXzpw5U+Y2Z86cMSgPAMHBwXz5pKQkPHjwwKCMQqFA165d+TJnzpyBUqlEp06d+DK9evWCQCDAuXPnatX5lEWlUoHjOCiVSoPlCxcuhJ2dHTp06IAvv/wSxcXFVT4XoGbPJzo6Go6OjmjevDkmTJiAR48eGeyjrl6fhw8f4sCBAxg7dmypdbXh+lTHPi9duoSioiKDMi1atIC7u3uVj1uZ41cHlUoFALC1tTVYvnXrVtjb26NNmzaYOXMm8vPzn+s4NXk+t27dgouLC7y9vTFixAikpKTw62rqGpni+mg0GmzZsgVjxowpNcl7bbw++fn5KCoq4j9LpvwOokl+G6B//vkHWq0WjRs3NljeuHFj/P3332Vu8+DBgzLLP3jwgF9fsqyiMo6OjgbrRSIRbG1t+TK15XyeVlhYiOnTp2P48OEGk0lOmjQJ/v7+sLW1xR9//IGZM2ciLS0NX331Va07n5CQEISGhsLLywuJiYn47LPP0KdPH5w5cwZCobBOX59NmzZBLpcjNDTUYHltuT7Vsc8HDx5ALBaXStwrel+q8/jPS6fTYcqUKXjppZfQpk0bfnlYWBg8PDzg4uKCP//8E9OnT0d8fDx2795d5WPV1Pl07doVGzduRPPmzZGWlobIyEi8/PLLuH79OuRyeY1dI1Ncn7179yIrKwujR482WF5br8/06dPh4uLCJ0qm/A6ixImQZygqKsKQIUPAGMOqVasM1k2dOpV/7ufnB7FYjHfffRcLFiyoddMaDBs2jH/etm1b+Pn5oWnTpoiOjkZQUJAZI3t+69evx4gRI2BpaWmwvC5dn/pu4sSJuH79Ok6fPm2wfPz48fzztm3bwtnZGUFBQUhMTETTpk1NHWaF+vTpwz/38/ND165d4eHhgZ9++qnM2s66ZN26dejTpw9cXFwMltfG67Nw4UJs374d0dHRpX7nTYGa6hoge3t7CIXCUnd6PHz4EE5OTmVu4+TkVGH5kp/PKpOenm6wvri4GJmZmeUe11znU6Ikabpz5w6OHDliUNtUlq5du6K4uBjJycmVP5F/1eT5PMnb2xv29vZISEjg91HXrg8AnDp1CvHx8XjnnXeeGYu5rk917NPJyQkajQZZWVnVdtzKHP95fPDBB9i/fz+OHz8ONze3Cst27doVAPjPZVXU9PmUUCqVaNasmcHvUE1co5o+nzt37uDo0aNG/w4B5rs+ixcvxsKFC3H48GH4+fnxy035HUSJUwMkFovRsWNHHDt2jF+m0+lw7NgxBAQElLlNQECAQXkAOHLkCF/ey8sLTk5OBmWys7Nx7tw5vkxAQACysrJw6dIlvszvv/8OnU7H/zLWlvMB/pc03bp1C0ePHoWdnd0zY7ly5QoEAkGp6uDKqKnzeVpqaioePXoEZ2dnfh916fqUWLduHTp27Ih27do9MxZzXZ/q2GfHjh1hYWFhUCY+Ph4pKSlVPm5ljl8VjDF88MEH2LNnD37//Xd4eXk9c5srV64AAP+5rIqaOp+n5ebmIjExkY+1pq5RTZ/Phg0b4OjoiL59+z6zrDmvz6JFixAVFYVDhw4Z9FMCTPwdZHQ3clKvbN++nUkkErZx40Z248YNNn78eKZUKtmDBw8YY4y99dZbbMaMGXz5mJgYJhKJ2OLFi1lcXBybPXt2mcMRKJVKtm/fPvbnn3+yAQMGlHkraIcOHdi5c+fY6dOnma+vb7Xd7l6d56PRaFj//v2Zm5sbu3LlisGtuGq1mjHG2B9//MGWLl3Krly5whITE9mWLVuYg4MDGzVqVK07n5ycHPbJJ5+wM2fOsKSkJHb06FHm7+/PfH19WWFhIb+funJ9SqhUKmZlZcVWrVpV6pi16fqo1Wp2+fJldvnyZebs7Mw++eQTdvnyZXbr1i2j98mY/lZ3d3d39vvvv7OLFy+ygIAAFhAQ8NznU1PnNGHCBKZQKFh0dLTB71B+fj5jjLGEhAQ2d+5cdvHiRZaUlMT27dvHvL29Wffu3Wvl+Xz88ccsOjqaJSUlsZiYGNarVy9mb2/P0tPT+TI1dY1q4nwY09/N5u7uzqZPn17qmLXp+ixcuJCJxWK2c+dOg89STk6OQRlTfAdR4tSAff3118zd3Z2JxWLWpUsXdvbsWX5dYGAgCw8PNyj/008/sWbNmjGxWMxat27NDhw4YLBep9OxWbNmscaNGzOJRMKCgoJYfHy8QZlHjx6x4cOHM5lMxmxsbNjbb79t8MGvLeeTlJTEAJT5KBnj5NKlS6xr165MoVAwS0tL1rJlSzZ//nyDRKS2nE9+fj7r3bs3c3BwYBYWFszDw4ONGzfO4EuZsbpzfUqsXr2aSaVSlpWVVWpdbbo+5X2eAgMDjd4nY4wVFBSw999/nzVq1IhZWVmxQYMGsbS0tGo5n5o4p/J+hzZs2MAYYywlJYV1796d2draMolEwnx8fNi0adOqZZygmjifoUOHMmdnZyYWi5mrqysbOnQoS0hIMDhmTV6jmvjM/fbbbwxAqb/VjNWu6+Ph4VHm+cyePZsvY6rvII4xxoyvnyKEEEIIabiojxMhhBBCiJEocSKEEEIIMRIlToQQQgghRqLEiRBCCCHESJQ4EUIIIYQYiRInQgghhBAjUeJECCGEEGIkSpwIIYQQQoxEiRMhhFRBdHQ0PD09zR0GACA5ORkcx5k7DEIaBEqcCCGkGpw4cQI9e/aEra0trKys4Ovri/DwcGg0GgD6RIvjODRq1AiFhYUG2164cAEcxxkkPyXlOY6DQCCAQqFAhw4d8OmnnyItLc2k50YI+R9KnAgh5DnduHEDISEh6NSpE06ePIlr167h66+/hlgshlarNSgrl8uxZ88eg2Xr1q2Du7t7mfuOj4/H/fv3ceHCBUyfPh1Hjx5FmzZtcO3atRo7H0JI+ShxIoSQ53T48GE4OTlh0aJFaNOmDZo2bYqQkBCsWbMGUqnUoGx4eDjWr1/Pvy4oKMD27dsRHh5e5r4dHR3h5OSEZs2aYdiwYYiJiYGDgwMmTJhQo+dECCkbJU6EEPKcnJyckJaWhpMnTz6z7FtvvYVTp04hJSUFALBr1y54enrC39/fqGNJpVK89957iImJQXp6+nPFTQipPEqcCCHkOb355psYPnw4AgMD4ezsjEGDBmHlypXIzs4uVdbR0RF9+vTBxo0bAQDr16/HmDFjKnW8Fi1aANB3CieEmBYlToQQ8pyEQiE2bNiA1NRULFq0CK6urpg/fz5at25dZkfuMWPGYOPGjbh9+zbOnDmDESNGVOp4jDEAoDvpCDEDSpwIIaSauLq64q233sLKlSvx119/obCwEN99912pcn369EFBQQHGjh2Lfv36wc7OrlLHiYuLA4BaMxwCIQ0JJU6EEFIDGjVqBGdnZ+Tl5ZVaJxKJMGrUKERHR1e6ma6goADff/89unfvDgcHh+oKlxBiJJG5AyCEkLpu9erVuHLlCgYNGoSmTZuisLAQmzdvxl9//YWvv/66zG2ioqIwbdq0Z9Y2paeno7CwEDk5Obh06RIWLVqEf/75B7t3766JUyGEPAMlToQQ8py6dOmC06dP47333sP9+/chk8nQunVr7N27F4GBgWVuIxaLYW9v/8x9N2/eHBzHQSaTwdvbG71798bUqVPh5ORU3adBCDECx0p6GRJCCDFadHQ0Ro8eXSvubEtOToaXlxfozzkhNY/6OBFCCCGEGIkSJ0IIIYQQI1HiRAghVeDp6YkpU6aYOwwAgFKpxOzZs80dBiENAvVxIoQQQggxEtU4EUIIIYQYiRInQgghhBAjUeJECCGEEGIkSpwIIYQQQoxEiRMhhBBCiJEocSKEEEIIMRIlToQQQgghRqLEiRBCCCHESP8PEVAIUVX7qdQAAAAASUVORK5CYII=\n",
            "text/plain": [
              "<Figure size 600x300 with 1 Axes>"
            ]
          },
          "metadata": {},
          "output_type": "display_data"
        }
      ],
      "source": [
        "import numpy as np, pandas as pd\n",
        "from sklearn.metrics import roc_auc_score, brier_score_loss\n",
        "import matplotlib.pyplot as plt\n",
        "\n",
        "# ① 공변량별 SMD(before/after) 계산\n",
        "def smd_table(dfc, covs, sw=None):\n",
        "    def _smd(x, t, w=None):\n",
        "        x=np.asarray(x,float); t=np.asarray(t,int); w=np.ones_like(t,float) if w is None else np.asarray(w,float)\n",
        "        m1=np.average(x[t==1],weights=w[t==1]); m0=np.average(x[t==0],weights=w[t==0])\n",
        "        v1=np.average((x[t==1]-m1)**2,weights=w[t==1]); v0=np.average((x[t==0]-m0)**2,weights=w[t==0])\n",
        "        return (m1-m0)/np.sqrt((v1+v0)/2+1e-9)\n",
        "    T = dfc[\"vpt_flag\"].astype(int).values\n",
        "    W = None if sw is None else sw\n",
        "    rows=[]\n",
        "    for c in covs:\n",
        "        if c not in dfc.columns: continue\n",
        "        x = pd.to_numeric(dfc[c], errors=\"coerce\").fillna(dfc[c].median())\n",
        "        b = abs(_smd(x, T, None))\n",
        "        a = abs(_smd(x, T, W))\n",
        "        rows.append({\"covariate\":c, \"SMD_before\":b, \"SMD_after\":a})\n",
        "    return pd.DataFrame(rows).sort_values(\"SMD_after\")\n",
        "\n",
        "# ② PS 진단(AUC, Brier, KS)\n",
        "from sklearn.linear_model import LogisticRegression\n",
        "from scipy.stats import ks_2samp\n",
        "\n",
        "def ps_diagnostics(dfc, covs):\n",
        "    X = dfc[covs].apply(pd.to_numeric, errors=\"coerce\").fillna(dfc[covs].median(numeric_only=True))\n",
        "    y = dfc[\"vpt_flag\"].astype(int).values\n",
        "    m = LogisticRegression(max_iter=400, solver=\"lbfgs\", random_state=7).fit(X, y)\n",
        "    ps = m.predict_proba(X)[:,1]\n",
        "    auc = roc_auc_score(y, ps)\n",
        "    bs  = brier_score_loss(y, ps)\n",
        "    ks  = ks_2samp(ps[y==1], ps[y==0]).statistic\n",
        "    return ps, {\"AUC\":auc, \"Brier\":bs, \"KS\":ks}\n",
        "\n",
        "# 사용 예시 (당신 코드의 covset과 동일하게)\n",
        "base_covs = [\"age\",\"sexM\",\"is_emerg\",\"baseline\"]\n",
        "llm_covs  = base_covs + [\"f_ckd_pre\",\"f_dm_pre\",\"f_hf_pre\",\"f_liver_pre\",\"f_nephrotox_pre\"]\n",
        "\n",
        "# BASE\n",
        "ps_base, diag_base = ps_diagnostics(dfc, base_covs)\n",
        "smd_base = smd_table(dfc, base_covs, sw=None)\n",
        "\n",
        "# BASE+LLM (IPTW용 가중치 재계산 필요 시, 당신의 fit_ps_and_sw 사용)\n",
        "from math import inf\n",
        "_, ps_llm, sw_llm, ESS_llm = fit_ps_and_sw(dfc, llm_covs)\n",
        "_, diag_llm = ps_diagnostics(dfc, llm_covs)\n",
        "smd_llm_w = smd_table(dfc, llm_covs, sw=sw_llm)\n",
        "\n",
        "print(\"PS AUC: BASE vs LLM →\", diag_base[\"AUC\"], \"vs\", diag_llm[\"AUC\"])\n",
        "print(\"PS KS:  BASE vs LLM →\", diag_base[\"KS\"],  \"vs\", diag_llm[\"KS\"])\n",
        "print(\"ESS(LLM):\", ESS_llm)\n",
        "\n",
        "# 간단 Love plot (after)\n",
        "plt.figure(figsize=(6, max(3, len(smd_llm_w)*0.25)))\n",
        "y = np.arange(len(smd_llm_w))\n",
        "plt.scatter(smd_llm_w[\"SMD_before\"], y, label=\"Before\", alpha=0.6)\n",
        "plt.scatter(smd_llm_w[\"SMD_after\"],  y, label=\"After (IPTW)\", alpha=0.9)\n",
        "plt.axvline(0.1, ls=\"--\")\n",
        "plt.yticks(y, smd_llm_w[\"covariate\"])\n",
        "plt.xlabel(\"|SMD|\"); plt.legend(); plt.title(\"Love plot (BASE+LLM)\")\n",
        "plt.tight_layout(); plt.show()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "5jhchW-g8Pil"
      },
      "outputs": [],
      "source": [
        "from joblib import Parallel, delayed\n",
        "import numpy as np\n",
        "import pandas as pd\n",
        "from sklearn.linear_model import LogisticRegression\n",
        "from lifelines import CoxPHFitter\n",
        "\n",
        "def _iptw_loghr_numpy(dfc, covs, RANDOM_STATE=7, ps_clip=(1e-3, 1-1e-3), w_trim=(0.01,0.99)):\n",
        "    \"\"\" dfc, covs -> stabilized IPTW weights -> Cox(log HR) \"\"\"\n",
        "    # 넘파이 설계행렬\n",
        "    T = dfc[\"vpt_flag\"].to_numpy(dtype=int)\n",
        "    time  = pd.to_numeric(dfc[\"duration_days\"], errors=\"coerce\").to_numpy()\n",
        "    event = dfc[\"event_observed\"].astype(int).to_numpy()\n",
        "\n",
        "    X = dfc[covs].apply(pd.to_numeric, errors=\"coerce\")\n",
        "    X = X.fillna(X.median(numeric_only=True))\n",
        "    X = X.to_numpy()\n",
        "\n",
        "    # PS\n",
        "    lr = LogisticRegression(max_iter=200, solver=\"lbfgs\", random_state=RANDOM_STATE, warm_start=True)\n",
        "    lr.fit(X, T)\n",
        "    ps = lr.predict_proba(X)[:,1].clip(*ps_clip)\n",
        "\n",
        "    # Stabilized weights + trim\n",
        "    p_t = float(T.mean())\n",
        "    sw = np.where(T==1, p_t/ps, (1-p_t)/(1-ps))\n",
        "    lo, hi = np.quantile(sw, w_trim)\n",
        "    sw = np.clip(sw, lo, hi)\n",
        "\n",
        "    # Cox (lifelines는 DF 필요)\n",
        "    df_small = pd.DataFrame({\n",
        "        \"time\": time,\n",
        "        \"event\": event,\n",
        "        \"treat\": T,\n",
        "        \"sw\": sw\n",
        "    })\n",
        "    cph = CoxPHFitter(penalizer=0.1)\n",
        "    cph.fit(df_small, duration_col=\"time\", event_col=\"event\", weights_col=\"sw\", robust=True)\n",
        "    logHR = float(cph.params_[\"treat\"])\n",
        "    return logHR\n",
        "\n",
        "def _one_boot(idx, dfc, base_covs, llm_covs, use_subsample=False, m_frac=0.7, seed=7):\n",
        "    rng = np.random.default_rng(seed + idx*13)\n",
        "    n = len(dfc)\n",
        "    if use_subsample:\n",
        "        m = max(50, int(m_frac*n))\n",
        "        take = rng.integers(0, n, m)\n",
        "    else:\n",
        "        take = rng.integers(0, n, n)\n",
        "    d = dfc.iloc[take].reset_index(drop=True)\n",
        "\n",
        "    logHR_b = _iptw_loghr_numpy(d, base_covs)\n",
        "    logHR_l = _iptw_loghr_numpy(d, llm_covs)\n",
        "    return (logHR_l - logHR_b)\n",
        "\n",
        "def bootstrap_hr_diff_fast(\n",
        "    dfc, base_covs, llm_covs, B=300, n_jobs=-1,\n",
        "    use_subsample=False, m_frac=0.7, seed=7\n",
        "):\n",
        "    diffs = Parallel(n_jobs=n_jobs, backend=\"loky\", verbose=0)(\n",
        "        delayed(_one_boot)(b, dfc, base_covs, llm_covs, use_subsample, m_frac, seed)\n",
        "        for b in range(B)\n",
        "    )\n",
        "    diffs = np.array(diffs, float)\n",
        "    ci_lo, ci_hi = np.percentile(diffs, [2.5, 97.5])\n",
        "    p_two = 2 * min((diffs<=0).mean(), (diffs>=0).mean())\n",
        "    return {\n",
        "        \"mean_diff_logHR\": float(diffs.mean()),\n",
        "        \"CI95\": (float(ci_lo), float(ci_hi)),\n",
        "        \"p\": float(p_two),\n",
        "        \"n_boot\": int(B),\n",
        "        \"subsample\": bool(use_subsample),\n",
        "        \"m_frac\": float(m_frac),\n",
        "    }"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "background_save": true
        },
        "id": "grFLf5zRgF18",
        "outputId": "add42325-6252-4e62-ed57-61eeed445693"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "{'mean_diff_logHR': -0.028217227362732255, 'CI95': (-0.035092348369610366, -0.021293798831406974), 'p': 0.0, 'n_boot': 300, 'subsample': False, 'm_frac': 0.7}\n",
            "{'mean_diff_logHR': -0.028217227362732255, 'CI95': (-0.035092348369610366, -0.021293798831406974), 'p': 0.0, 'n_boot': 300, 'subsample': False, 'm_frac': 0.7}\n"
          ]
        }
      ],
      "source": [
        "base_covs = [\"age\",\"sexM\",\"is_emerg\",\"baseline\"]\n",
        "llm_covs  = base_covs + [\"f_ckd_pre\",\"f_dm_pre\",\"f_hf_pre\",\"f_liver_pre\",\"f_nephrotox_pre\"]\n",
        "\n",
        "# 1) 정확도 우선 (전체 n 부트스트랩, 병렬화)\n",
        "boot = bootstrap_hr_diff_fast(dfc, base_covs, llm_covs, B=300, n_jobs=-1)\n",
        "print(boot)\n"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "background_save": true
        },
        "id": "cFOonu2e8RUe",
        "outputId": "9fcf9938-0427-4b41-b6ce-1c8ef19c0801"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "\n",
            "[Treatment ~ LLM confounders] pseudo-R2: 0.007269798443215625\n",
            "===================================================================================\n",
            "                      coef    std err          z      P>|z|      [0.025      0.975]\n",
            "-----------------------------------------------------------------------------------\n",
            "const              -2.5590      0.018   -139.625      0.000      -2.595      -2.523\n",
            "f_ckd_pre           0.2252      0.029      7.805      0.000       0.169       0.282\n",
            "f_dm_pre            0.0196      0.026      0.742      0.458      -0.032       0.071\n",
            "f_hf_pre            0.0582      0.027      2.156      0.031       0.005       0.111\n",
            "f_liver_pre         0.4013      0.028     14.437      0.000       0.347       0.456\n",
            "f_nephrotox_pre    -0.0294      0.031     -0.957      0.338      -0.089       0.031\n",
            "===================================================================================\n",
            "\n",
            "[Outcome ~ Treatment + LLM confounders] pseudo-R2: 0.03569354665073887\n",
            "===================================================================================\n",
            "                      coef    std err          z      P>|z|      [0.025      0.975]\n",
            "-----------------------------------------------------------------------------------\n",
            "const              -2.0291      0.015   -138.845      0.000      -2.058      -2.000\n",
            "f_ckd_pre           0.7014      0.022     32.556      0.000       0.659       0.744\n",
            "f_dm_pre           -0.0080      0.020     -0.409      0.683      -0.047       0.030\n",
            "f_hf_pre            0.3477      0.020     17.734      0.000       0.309       0.386\n",
            "f_liver_pre        -0.0920      0.022     -4.139      0.000      -0.136      -0.048\n",
            "f_nephrotox_pre     0.0729      0.022      3.277      0.001       0.029       0.117\n",
            "vpt_flag            0.5915      0.028     21.405      0.000       0.537       0.646\n",
            "===================================================================================\n"
          ]
        }
      ],
      "source": [
        "import statsmodels.api as sm\n",
        "\n",
        "def assoc_checks(dfc, llm_covs):\n",
        "    Xt = dfc[llm_covs].apply(pd.to_numeric, errors=\"coerce\").fillna(0)\n",
        "    Xt = sm.add_constant(Xt)\n",
        "    mt = sm.Logit(dfc[\"vpt_flag\"].astype(int), Xt).fit(disp=0)\n",
        "    print(\"\\n[Treatment ~ LLM confounders] pseudo-R2:\", mt.prsquared)\n",
        "    print(mt.summary().tables[1])\n",
        "\n",
        "    Xy = pd.concat([dfc[llm_covs], dfc[[\"vpt_flag\"]]], axis=1).apply(pd.to_numeric, errors=\"coerce\").fillna(0)\n",
        "    Xy = sm.add_constant(Xy)\n",
        "    my = sm.Logit(dfc[\"event_observed\"].astype(int), Xy).fit(disp=0)\n",
        "    print(\"\\n[Outcome ~ Treatment + LLM confounders] pseudo-R2:\", my.prsquared)\n",
        "    print(my.summary().tables[1])\n",
        "\n",
        "assoc_checks(dfc, [\"f_ckd_pre\",\"f_dm_pre\",\"f_hf_pre\",\"f_liver_pre\",\"f_nephrotox_pre\"])"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "tpfHI4PGgM48"
      },
      "outputs": [],
      "source": []
    }
  ],
  "metadata": {
    "colab": {
      "provenance": []
    },
    "kernelspec": {
      "display_name": "Python 3",
      "name": "python3"
    },
    "language_info": {
      "name": "python"
    }
  },
  "nbformat": 4,
  "nbformat_minor": 0
}