{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "/Users/scott/Documents/projects/WAG-Code\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 1,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import os\n",
    "import sys\n",
    "from openai import OpenAI\n",
    "import pandas as pd\n",
    "# Change directory up one level\n",
    "os.chdir('../..')\n",
    "print(os.getcwd())\n",
    "from query.base import Base\n",
    "from query.rag import Rag\n",
    "from query.wag import Wag\n",
    "\n",
    "\n",
    "import json\n",
    "from utils.umls import umls\n",
    "from prompt.EntityMerge import ENTITY_MERGE_JSON_PROMPT_ALL\n",
    "from prompt.Context import CONTEXT_PROMPT\n",
    "from openai import OpenAI\n",
    "from dotenv import load_dotenv\n",
    "from langchain_community.utilities import GoogleSerperAPIWrapper\n",
    "from models.entity import Entity\n",
    "from models.relationship import Relationship\n",
    "from utils import parse_llm_response,search_docs\n",
    "from prompt.Query import QUERY_PROMPT_KGRAG, QUERY_PROMPT_BASE\n",
    "import random\n",
    "\n",
    "from retriever import *\n",
    "from collections import defaultdict\n",
    "from itertools import product\n",
    "from scipy.spatial.distance import pdist\n",
    "from tqdm import tqdm  # for progress bar\n",
    "import numpy as np\n",
    "from concurrent.futures import ThreadPoolExecutor\n",
    "\n",
    "\n",
    "\n",
    "\n",
    "load_dotenv()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Resting time\n",
      "Inactive time\n",
      "Active time\n",
      "Lightly active time\n",
      "Moderately active time\n",
      "Highly active time\n",
      "Steps taken\n",
      "Distance traveled\n",
      "Energy expenditure\n",
      "Exercise\n",
      "Step goal\n",
      "Total sleep duration\n",
      "Asleep duration\n",
      "Light sleep duration\n",
      "Deep sleep duration\n",
      "Rem sleep duration\n",
      "Wake after sleep onset\n",
      "Sleep efficiency\n",
      "Bedtime start time\n",
      "Bedtime end time\n",
      "Sleep onset latency\n",
      "Midpoint of sleep\n",
      "Time after wakeup\n",
      "HRV RMSSD\n",
      "Resting heart rate\n",
      "Nightly skin temperature\n",
      "Blood oxygen saturation\n",
      "Sleep breathing rate\n",
      "Temperature Variation\n",
      "VO2 Max\n",
      "Skin conductance\n",
      "PANAS positive affect\n",
      "PANAS negative affect\n",
      "Mental stress\n",
      "Mental fatigue\n",
      "Mood\n",
      "Anxiety\n",
      "Depression\n",
      "Lifelog\n",
      "Number of calls\n",
      "Entropy of call duration\n",
      "Number of phone unlock\n",
      "Duration of phone unlock\n",
      "Time at home\n",
      "The Radius of Gyration\n",
      "Maximum distance from home\n",
      "Circadian rhythm patterns\n",
      "Age\n",
      "Gender\n",
      "Bmi\n",
      "Personality\n",
      "Barometric pressure\n"
     ]
    }
   ],
   "source": [
    "root_dir = 'resources'\n",
    "\n",
    "\n",
    "with open(f\"{root_dir}/kg/nodes_with_embeddings.json\", 'r') as f:\n",
    "    nodes = json.load(f)\n",
    "    for node in nodes:\n",
    "            nodes[node] = Entity.from_dict(nodes[node])\n",
    "\n",
    "\n",
    "with open(f\"{root_dir}/kg/edges.json\", 'r') as f:\n",
    "    edges = json.load(f)\n",
    "    for edge in edges:\n",
    "            edges[edge] = Relationship.from_dict(edges[edge])\n",
    "\n",
    "path_map = {\n",
    "    'pmdata': 'pmdata_df',\n",
    "    'ifh_affect': 'ifh_df',\n",
    "    'globem': 'globem_df',\n",
    "    'lifesnap': 'lifesnap_df',\n",
    "}\n",
    "with open(f'{root_dir}/features_map_dict_with_descriptionv3.json', 'r') as f:\n",
    "    features_map_dict = json.load(f)\n",
    "\n",
    "\n",
    "with open(f'{root_dir}/relationship_dict.json', 'r') as f:\n",
    "    relationship_dict = json.load(f)\n",
    "\n",
    "dataset_metric_dict = {\n",
    "    'lifesnap': [],\n",
    "    'pmdata': [],\n",
    "    'ifh_affect': [],\n",
    "    'globem': []\n",
    "}\n",
    "#get the data associated metrics for each dataset\n",
    "for key, value in features_map_dict.items():\n",
    "    print(key)\n",
    "    # print(value['alias'])\n",
    "    for key2, value2 in value['alias'].items():\n",
    "        if pd.notna(value2):\n",
    "            # node_name = key[0].upper() + key[1:]\n",
    "            dataset_metric_dict[key2].append(key)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Heart rate\n",
      "Heart rate variability\n",
      "Blood pressure\n",
      "Blood oxygen saturation\n",
      "Pulse wave velocity\n",
      "Cardiac output\n",
      "Peripheral blood flow\n",
      "Respiratory rate\n",
      "Oxygen uptake\n",
      "Carbon dioxide exhalation rate\n",
      "Lung volume\n",
      "Breathing rhythm\n",
      "Muscle activity\n",
      "Blood glucose levels\n",
      "Lactate levels\n",
      "Basal metabolic rate\n",
      "Core body temperature\n",
      "Brain activity\n",
      "Skin temperature\n",
      "Sweat rate\n",
      "Electrolyte concentration\n",
      "Skin hydration levels\n",
      "Skin conductance\n",
      "PH of sweat\n",
      "Sleep stages (light, deep, REM)\n",
      "Sleep apnea events\n",
      "Total sleep duration\n",
      "Sleep onset latency\n",
      "Wake after sleep onset\n",
      "Sleep efficiency\n",
      "Arousals per night\n",
      "Breathing irregularities\n",
      "Snoring patterns\n",
      "Circadian rhythm patterns\n",
      "Steps taken\n",
      "Distance traveled\n",
      "Active time\n",
      "Energy expenditure\n",
      "Activity level\n",
      "Running dynamics\n",
      "Balance and stability\n",
      "Joint movement and flexibility\n",
      "Mental stress\n",
      "Mental fatigue\n",
      "Mental workload\n",
      "Engagement\n",
      "Cognitive load\n",
      "Memory performance\n",
      "Decision-making speed\n",
      "Mood\n",
      "Ambient temperature\n",
      "Humidity\n",
      "Barometric pressure\n",
      "UV radiation exposure\n",
      "Air quality\n",
      "Noise levels\n",
      "Electromagnetic field exposure\n",
      "Altitude\n",
      "GPS location\n",
      "Travel patterns\n",
      "Proximity to other devices or people\n",
      "Interaction frequency with social contacts\n",
      "Time spent on specific activities\n",
      "Screen interaction patterns\n",
      "Daily routine adherence\n",
      "Resting time\n",
      "Inactive time\n",
      "Lightly active time\n",
      "Moderately active time\n",
      "Highly active time\n",
      "Exercise\n",
      "Step goal\n",
      "Asleep duration\n",
      "Light sleep duration\n",
      "Deep sleep duration\n",
      "Rem sleep duration\n",
      "Bedtime start time\n",
      "Bedtime end time\n",
      "Midpoint of sleep\n",
      "Time after wakeup\n",
      "HRV RMSSD\n",
      "Resting heart rate\n",
      "Nightly skin temperature\n",
      "Sleep breathing rate\n",
      "Temperature Variation\n",
      "VO2 Max\n",
      "PANAS positive affect\n",
      "PANAS negative affect\n",
      "Anxiety\n",
      "Depression\n",
      "Lifelog\n",
      "Number of calls\n",
      "Entropy of call duration\n",
      "Number of phone unlock\n",
      "Duration of phone unlock\n",
      "Time at home\n",
      "The Radius of Gyration\n",
      "Maximum distance from home\n",
      "Age\n",
      "Gender\n",
      "Bmi\n",
      "Personality\n"
     ]
    }
   ],
   "source": [
    "for n in nodes:\n",
    "    print(nodes[n].name)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "QA_df = pd.read_json(f\"{root_dir}/qa_df_full.json\", orient='records')\n",
    "QA_df_with_queries = QA_df\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "import pandas as pd\n",
    "from typing import Any, Dict, List, Union\n",
    "def convert_to_serializable(obj: Any) -> Any:\n",
    "    if isinstance(obj, pd.Timestamp):\n",
    "        return obj.isoformat()\n",
    "    elif hasattr(obj, '__dict__'):  # For Entity and similar custom objects\n",
    "        return {k: convert_to_serializable(v) for k, v in obj.__dict__.items()}\n",
    "    elif isinstance(obj, dict):\n",
    "        return {k: convert_to_serializable(v) for k, v in obj.items()}\n",
    "    elif isinstance(obj, (list, tuple)):\n",
    "        return [convert_to_serializable(x) for x in obj]\n",
    "    return obj"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Processing datasets:   0%|          | 0/4 [00:00<?, ?it/s]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "lifesnap\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n",
      "\u001b[A/var/folders/n4/pwy0ts2n7hjg6wg7l9lc63k80000gn/T/ipykernel_15663/2723791789.py:242: FutureWarning: The behavior of DataFrame concatenation with empty or all-NA entries is deprecated. In a future version, this will no longer exclude empty or all-NA columns when determining the result dtypes. To retain the old behavior, exclude the relevant entries before the concat operation.\n",
      "  results_df = pd.concat([results_df, row_df], ignore_index=True)\n",
      "\n",
      "\u001b[A\n",
      "\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Inactive timeInactive time\n",
      "\n",
      "Inactive time\n",
      "Inactive time\n",
      "Inactive time\n",
      "Inactive time\n",
      "Inactive time\n",
      "Inactive time\n",
      "Inactive time\n",
      "Inactive time\n",
      "Inactive time\n",
      "Active time\n",
      "Active time\n",
      "Active time\n",
      "Active time\n",
      "Active time\n",
      "Active time\n",
      "Active time\n",
      "Active time\n",
      "Active time\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Processing queries:   1%|          | 2/307 [00:00<00:42,  7.26it/s]\u001b[A\u001b[A\n",
      "\u001b[A\n",
      "\n",
      "Processing queries:   1%|▏         | 4/307 [00:00<00:40,  7.47it/s]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Active time\n",
      "Active time\n",
      "Lightly active time\n",
      "Lightly active time\n",
      "Lightly active time\n",
      "Lightly active time\n",
      "Lightly active time\n",
      "Lightly active time\n",
      "Lightly active time\n",
      "Lightly active time\n",
      "Lightly active time\n",
      "Lightly active time\n",
      "Lightly active time\n",
      "Moderately active time\n",
      "Moderately active time\n",
      "Moderately active time\n",
      "Moderately active time\n",
      "Moderately active time\n",
      "Moderately active time\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[A\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Moderately active time\n",
      "Moderately active time\n",
      "Moderately active time\n",
      "Moderately active time\n",
      "Moderately active time\n",
      "Highly active time\n",
      "Highly active time\n",
      "Highly active time\n",
      "Highly active time\n",
      "Highly active time\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n",
      "\u001b[A\n",
      "\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Highly active time\n",
      "Highly active time\n",
      "Highly active time\n",
      "Highly active time\n",
      "Highly active time\n",
      "Highly active time\n",
      "Steps taken\n",
      "Steps taken\n",
      "Steps taken\n",
      "Steps taken\n",
      "Steps taken\n",
      "Steps taken\n",
      "Steps taken\n",
      "Steps taken\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Processing queries:  17%|█▋        | 53/307 [00:01<00:03, 68.24it/s]\u001b[A\u001b[A\n",
      "\u001b[A\n",
      "\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Steps takenSteps taken\n",
      "\n",
      "Steps taken\n",
      "Distance traveled\n",
      "Distance traveled\n",
      "Distance traveled\n",
      "Distance traveled\n",
      "Distance traveled\n",
      "Distance traveled\n",
      "Distance traveled\n",
      "Distance traveled\n",
      "Distance traveled\n",
      "Distance traveled\n",
      "Distance traveled\n",
      "Energy expenditure\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Processing queries:  22%|██▏       | 68/307 [00:01<00:03, 59.86it/s]\u001b[A\u001b[A\n",
      "\n",
      "Processing queries:  24%|██▍       | 75/307 [00:01<00:04, 51.10it/s]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Energy expenditure\n",
      "Energy expenditure\n",
      "Energy expenditure\n",
      "Energy expenditure\n",
      "Energy expenditure\n",
      "Energy expenditure\n",
      "Energy expenditure\n",
      "Energy expenditure\n",
      "Energy expenditure\n",
      "Total sleep duration\n",
      "Energy expenditure\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[A\u001b[A\n",
      "\u001b[A\n",
      "\n",
      "Processing queries:  28%|██▊       | 87/307 [00:01<00:04, 54.21it/s]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Total sleep duration\n",
      "Total sleep duration\n",
      "Total sleep duration\n",
      "Total sleep duration\n",
      "Total sleep duration\n",
      "Total sleep duration\n",
      "Total sleep duration\n",
      "Total sleep duration\n",
      "Total sleep duration\n",
      "Total sleep duration\n",
      "Asleep duration\n",
      "Asleep duration\n",
      "Asleep duration\n",
      "Asleep duration\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[A\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Asleep durationAsleep duration\n",
      "\n",
      "Asleep duration\n",
      "Asleep duration\n",
      "Asleep duration\n",
      "Asleep duration\n",
      "Light sleep duration\n",
      "Asleep duration\n",
      "Light sleep duration\n",
      "Light sleep duration\n",
      "Light sleep duration\n",
      "Light sleep duration\n",
      "Light sleep duration\n",
      "Light sleep duration\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\n",
      "Processing queries:  39%|███▉      | 119/307 [00:02<00:03, 50.53it/s]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Light sleep duration\n",
      "Light sleep duration\n",
      "Light sleep duration\n",
      "Light sleep duration\n",
      "Deep sleep duration\n",
      "Deep sleep duration\n",
      "Deep sleep duration\n",
      "Deep sleep duration\n",
      "Deep sleep duration\n",
      "Deep sleep duration\n",
      "Deep sleep duration\n",
      "Deep sleep duration\n",
      "Deep sleep duration\n",
      "Deep sleep duration\n",
      "Deep sleep duration\n",
      "Rem sleep duration\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[A\u001b[A\n",
      "Processing queries:  43%|████▎     | 131/307 [00:02<00:03, 49.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Rem sleep duration\n",
      "Rem sleep duration\n",
      "Rem sleep duration\n",
      "Rem sleep duration\n",
      "Rem sleep duration\n",
      "Rem sleep duration\n",
      "Rem sleep duration\n",
      "Rem sleep duration\n",
      "Rem sleep duration\n",
      "Rem sleep duration\n",
      "Wake after sleep onset\n",
      "Wake after sleep onset\n",
      "Wake after sleep onset\n",
      "Wake after sleep onset\n",
      "Wake after sleep onset\n",
      "Wake after sleep onset\n",
      "Wake after sleep onset\n",
      "Wake after sleep onset\n",
      "Wake after sleep onset\n",
      "Wake after sleep onset\n",
      "Wake after sleep onset\n",
      "Sleep efficiency\n",
      "Sleep efficiency\n",
      "Sleep efficiency\n",
      "Sleep efficiency\n",
      "Sleep efficiency\n",
      "Sleep efficiency\n",
      "Sleep efficiency\n",
      "Sleep efficiency\n",
      "Sleep efficiency\n",
      "Sleep efficiency\n",
      "Sleep efficiency\n",
      "Sleep onset latency\n",
      "Time after wakeup\n",
      "Time after wakeup\n",
      "Time after wakeup\n",
      "Time after wakeup\n",
      "HRV RMSSD\n",
      "Time after wakeup\n",
      "HRV RMSSD\n",
      "HRV RMSSD\n",
      "HRV RMSSD\n",
      "HRV RMSSD\n",
      "HRV RMSSD\n",
      "HRV RMSSD\n",
      "HRV RMSSD\n",
      "HRV RMSSD\n",
      "HRV RMSSD\n",
      "Resting heart rate\n",
      "HRV RMSSD\n",
      "Resting heart rate\n",
      "Resting heart rate\n",
      "Resting heart rate\n",
      "Resting heart rate\n",
      "Resting heart rateResting heart rate\n",
      "\n",
      "Resting heart rate\n",
      "Resting heart rate\n",
      "Resting heart rate\n",
      "Resting heart rate\n",
      "Nightly skin temperature\n",
      "Nightly skin temperature\n",
      "Nightly skin temperature\n",
      "Nightly skin temperature\n",
      "Nightly skin temperature\n",
      "Nightly skin temperature\n",
      "Nightly skin temperature\n",
      "Nightly skin temperature\n",
      "Nightly skin temperature\n",
      "Nightly skin temperature\n",
      "Nightly skin temperature\n",
      "Blood oxygen saturation\n",
      "Blood oxygen saturation\n",
      "Blood oxygen saturation\n",
      "Blood oxygen saturation\n",
      "Blood oxygen saturation\n",
      "Blood oxygen saturation\n",
      "Blood oxygen saturation\n",
      "Blood oxygen saturation\n",
      "Blood oxygen saturation\n",
      "Blood oxygen saturation\n",
      "Sleep breathing rate\n",
      "Blood oxygen saturation\n",
      "Sleep breathing rate\n",
      "Sleep breathing rate\n",
      "Sleep breathing rate\n",
      "Sleep breathing rate\n",
      "Sleep breathing rate\n",
      "Sleep breathing rate\n",
      "Sleep breathing rate\n",
      "Sleep breathing rate\n",
      "Sleep breathing rate\n",
      "Temperature Variation\n",
      "Sleep breathing rate\n",
      "Temperature Variation\n",
      "Temperature Variation\n",
      "Temperature Variation\n",
      "Temperature Variation\n",
      "Temperature Variation\n",
      "Temperature Variation\n",
      "Temperature VariationTemperature Variation\n",
      "Temperature Variation\n",
      "\n",
      "Temperature Variation\n",
      "VO2 Max\n",
      "VO2 Max\n",
      "VO2 Max\n",
      "VO2 Max\n",
      "VO2 Max\n",
      "VO2 Max\n",
      "VO2 Max\n",
      "VO2 Max\n",
      "VO2 Max\n",
      "VO2 Max\n",
      "VO2 Max\n",
      "Skin conductance\n",
      "PANAS positive affect\n",
      "PANAS positive affect\n",
      "PANAS positive affect\n",
      "PANAS positive affect\n",
      "PANAS positive affect\n",
      "PANAS negative affect\n",
      "PANAS negative affect\n",
      "PANAS negative affect\n",
      "PANAS negative affect\n",
      "PANAS negative affect\n",
      "Bedtime start time\n",
      "Bedtime start time\n",
      "Bedtime start time\n",
      "Bedtime start time\n",
      "Bedtime start time\n",
      "Bedtime start time\n",
      "Bedtime start time\n",
      "Bedtime start time\n",
      "Bedtime start time\n",
      "Bedtime start time\n",
      "Bedtime start time\n",
      "Bedtime end time\n",
      "Bedtime end time\n",
      "Bedtime end time\n",
      "Bedtime end time\n",
      "Bedtime end time\n",
      "Bedtime end time\n",
      "Bedtime end time\n",
      "Bedtime end time\n",
      "Bedtime end time\n",
      "Bedtime end time\n",
      "Mood\n",
      "Bedtime end time\n",
      "Daily routine adherence\n",
      "Engagement\n",
      "Cognitive load\n",
      "Activity level\n",
      "Screen interaction patternsSteps taken\n",
      "\n",
      "Asleep duration\n",
      "Sleep breathing rate\n",
      "Distance traveled\n",
      "Bedtime start time\n",
      "Total sleep duration\n",
      "Distance traveled\n",
      "Bedtime start time\n",
      "Deep sleep duration\n",
      "Bedtime start time\n",
      "Energy expenditure\n",
      "Sleep efficiency\n",
      "Time after wakeup\n",
      "Steps taken\n",
      "Wake after sleep onset\n",
      "Temperature Variation\n",
      "PANAS negative affect\n",
      "Bedtime end time\n",
      "VO2 Max\n",
      "Sleep onset latency\n",
      "Wake after sleep onset\n",
      "Temperature Variation\n",
      "Steps taken\n",
      "Active time\n",
      "Deep sleep duration\n",
      "Resting heart rate\n",
      "Light sleep duration\n",
      "Resting heart rate\n",
      "Mood\n",
      "Rem sleep duration\n",
      "Active time\n",
      "Moderately active time\n",
      "Sleep breathing rate\n",
      "Energy expenditure\n",
      "Blood oxygen saturation\n",
      "Deep sleep duration\n",
      "Resting heart rate\n",
      "Sleep breathing rateSteps taken\n",
      "\n",
      "Wake after sleep onset\n",
      "Deep sleep duration\n",
      "Bedtime end time\n",
      "Bedtime start time\n",
      "Resting heart rate\n",
      "Highly active time\n",
      "Nightly skin temperature\n",
      "HRV RMSSD\n",
      "Rem sleep duration\n",
      "Mood\n",
      "Time after wakeup\n",
      "VO2 Max\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Processing users for lifesnap:   0%|          | 0/10 [00:07<?, ?it/s]\n",
      "Processing datasets:   0%|          | 0/4 [00:07<?, ?it/s]\n"
     ]
    },
    {
     "ename": "KeyboardInterrupt",
     "evalue": "",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mKeyboardInterrupt\u001b[0m                         Traceback (most recent call last)",
      "Cell \u001b[0;32mIn[6], line 227\u001b[0m\n\u001b[1;32m    221\u001b[0m \u001b[38;5;28;01mwith\u001b[39;00m ThreadPoolExecutor(max_workers\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m10\u001b[39m) \u001b[38;5;28;01mas\u001b[39;00m executor:\n\u001b[1;32m    222\u001b[0m     future_to_row \u001b[38;5;241m=\u001b[39m {\n\u001b[1;32m    223\u001b[0m         executor\u001b[38;5;241m.\u001b[39msubmit(process_single_row, row, clients, par_df, dataset_name, rel_info, user_id): row \n\u001b[1;32m    224\u001b[0m         \u001b[38;5;28;01mfor\u001b[39;00m _, row \u001b[38;5;129;01min\u001b[39;00m queries_per_user\u001b[38;5;241m.\u001b[39miterrows()\n\u001b[1;32m    225\u001b[0m     }\n\u001b[0;32m--> 227\u001b[0m \u001b[43m    \u001b[49m\u001b[38;5;28;43;01mfor\u001b[39;49;00m\u001b[43m \u001b[49m\u001b[43mfuture\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;129;43;01min\u001b[39;49;00m\u001b[43m \u001b[49m\u001b[43mtqdm\u001b[49m\u001b[43m(\u001b[49m\u001b[43mas_completed\u001b[49m\u001b[43m(\u001b[49m\u001b[43mfuture_to_row\u001b[49m\u001b[43m)\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mtotal\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43mlen\u001b[39;49m\u001b[43m(\u001b[49m\u001b[43mfuture_to_row\u001b[49m\u001b[43m)\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mdesc\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[38;5;124;43mProcessing queries\u001b[39;49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[43m)\u001b[49m\u001b[43m:\u001b[49m\n\u001b[1;32m    228\u001b[0m \u001b[43m        \u001b[49m\u001b[38;5;28;43;01mtry\u001b[39;49;00m\u001b[43m:\u001b[49m\n\u001b[1;32m    229\u001b[0m \u001b[43m            \u001b[49m\u001b[43mq_dict\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mnew_rows\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43m \u001b[49m\u001b[43mfuture\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mresult\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n",
      "File \u001b[0;32m~/Documents/projects/WAG-Code/.venv/lib/python3.13/site-packages/tqdm/std.py:1181\u001b[0m, in \u001b[0;36mtqdm.__iter__\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m   1178\u001b[0m time \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_time\n\u001b[1;32m   1180\u001b[0m \u001b[38;5;28;01mtry\u001b[39;00m:\n\u001b[0;32m-> 1181\u001b[0m \u001b[43m    \u001b[49m\u001b[38;5;28;43;01mfor\u001b[39;49;00m\u001b[43m \u001b[49m\u001b[43mobj\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;129;43;01min\u001b[39;49;00m\u001b[43m \u001b[49m\u001b[43miterable\u001b[49m\u001b[43m:\u001b[49m\n\u001b[1;32m   1182\u001b[0m \u001b[43m        \u001b[49m\u001b[38;5;28;43;01myield\u001b[39;49;00m\u001b[43m \u001b[49m\u001b[43mobj\u001b[49m\n\u001b[1;32m   1183\u001b[0m \u001b[43m        \u001b[49m\u001b[38;5;66;43;03m# Update and possibly print the progressbar.\u001b[39;49;00m\n\u001b[1;32m   1184\u001b[0m \u001b[43m        \u001b[49m\u001b[38;5;66;43;03m# Note: does not call self.update(1) for speed optimisation.\u001b[39;49;00m\n",
      "File \u001b[0;32m/opt/homebrew/Cellar/python@3.13/3.13.1/Frameworks/Python.framework/Versions/3.13/lib/python3.13/concurrent/futures/_base.py:243\u001b[0m, in \u001b[0;36mas_completed\u001b[0;34m(fs, timeout)\u001b[0m\n\u001b[1;32m    238\u001b[0m     \u001b[38;5;28;01mif\u001b[39;00m wait_timeout \u001b[38;5;241m<\u001b[39m \u001b[38;5;241m0\u001b[39m:\n\u001b[1;32m    239\u001b[0m         \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mTimeoutError\u001b[39;00m(\n\u001b[1;32m    240\u001b[0m                 \u001b[38;5;124m'\u001b[39m\u001b[38;5;132;01m%d\u001b[39;00m\u001b[38;5;124m (of \u001b[39m\u001b[38;5;132;01m%d\u001b[39;00m\u001b[38;5;124m) futures unfinished\u001b[39m\u001b[38;5;124m'\u001b[39m \u001b[38;5;241m%\u001b[39m (\n\u001b[1;32m    241\u001b[0m                 \u001b[38;5;28mlen\u001b[39m(pending), total_futures))\n\u001b[0;32m--> 243\u001b[0m \u001b[43mwaiter\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mevent\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mwait\u001b[49m\u001b[43m(\u001b[49m\u001b[43mwait_timeout\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m    245\u001b[0m \u001b[38;5;28;01mwith\u001b[39;00m waiter\u001b[38;5;241m.\u001b[39mlock:\n\u001b[1;32m    246\u001b[0m     finished \u001b[38;5;241m=\u001b[39m waiter\u001b[38;5;241m.\u001b[39mfinished_futures\n",
      "File \u001b[0;32m/opt/homebrew/Cellar/python@3.13/3.13.1/Frameworks/Python.framework/Versions/3.13/lib/python3.13/threading.py:659\u001b[0m, in \u001b[0;36mEvent.wait\u001b[0;34m(self, timeout)\u001b[0m\n\u001b[1;32m    657\u001b[0m signaled \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_flag\n\u001b[1;32m    658\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m signaled:\n\u001b[0;32m--> 659\u001b[0m     signaled \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_cond\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mwait\u001b[49m\u001b[43m(\u001b[49m\u001b[43mtimeout\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m    660\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m signaled\n",
      "File \u001b[0;32m/opt/homebrew/Cellar/python@3.13/3.13.1/Frameworks/Python.framework/Versions/3.13/lib/python3.13/threading.py:359\u001b[0m, in \u001b[0;36mCondition.wait\u001b[0;34m(self, timeout)\u001b[0m\n\u001b[1;32m    357\u001b[0m \u001b[38;5;28;01mtry\u001b[39;00m:    \u001b[38;5;66;03m# restore state no matter what (e.g., KeyboardInterrupt)\u001b[39;00m\n\u001b[1;32m    358\u001b[0m     \u001b[38;5;28;01mif\u001b[39;00m timeout \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[0;32m--> 359\u001b[0m         \u001b[43mwaiter\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43macquire\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m    360\u001b[0m         gotit \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mTrue\u001b[39;00m\n\u001b[1;32m    361\u001b[0m     \u001b[38;5;28;01melse\u001b[39;00m:\n",
      "\u001b[0;31mKeyboardInterrupt\u001b[0m: "
     ]
    }
   ],
   "source": [
    "from concurrent.futures import ThreadPoolExecutor, as_completed\n",
    "import traceback\n",
    "hyperparameter = {\n",
    "    'rel_type': 'spearman',\n",
    "    'min_samples_needed': 10, # min number of samples needed to calculate relationship \n",
    "    't_global': 0.9,  #steepness of the sigmoid transformation  of correlation \n",
    "    'alpha_prior': 1, #prior weight\n",
    "    'alpha_pop':10**(0.94), #population weight\n",
    "    'alpha_ind': 10**(-1.31), #individual weight\n",
    "\n",
    "    't_local': 0.7, # control steepness of sigmoid transformation of abnromaility weight\n",
    "    'beta': 0.5, #weight of abnormality weight\n",
    "\n",
    "    'node_match_top_n': 1,\n",
    "    'max_num_related_nodes': 5,\n",
    "\n",
    "    'full_rel_only': False,\n",
    "    'demog_metrics': ['Bmi','Age','Gender','Personality'],\n",
    "    'weight_sort_by': 'rel_pop', #\n",
    "}\n",
    "\n",
    "\n",
    "parm_final = hyperparameter.copy()\n",
    "parm_final['weight_sort_by'] = 'weight_final'\n",
    "\n",
    "weight_keys = [\n",
    "            'llm_prior','rel_pop', 'posterior_pop', 'rel_ind',\n",
    "            'posterior_ind','weight_local','weight_global', 'weight_final'\n",
    "        ]\n",
    "\n",
    "demog_metrics = set(hyperparameter['demog_metrics'])\n",
    "prior_matrix = get_prior_matrix(root_dir+'/kg')\n",
    "\n",
    "results_df = pd.DataFrame(columns=[\n",
    "        'q_id', 'dataset', 'user_id', 'query', 'query_date', 'time_granularity',\n",
    "        'openness(assigned)', 'associated_entity(gt)', 'method',\n",
    "        'primary_nodes', 'related_nodes', 'context', 'response','data','eval_result'\n",
    "    ])\n",
    "\n",
    "datasets_to_eval = QA_df_with_queries.dataset.unique()\n",
    "# datasets_to_eval = ['globem']\n",
    "\n",
    "from tqdm import tqdm\n",
    "\n",
    "for dataset_name in tqdm(datasets_to_eval, desc=\"Processing datasets\"):\n",
    "    print(dataset_name)\n",
    "    with open(f'{root_dir}/processed_dataset/{path_map[dataset_name]}.csv', 'r') as f:\n",
    "            pop_df = pd.read_csv(f)\n",
    "    numeric_metrics = [col for col in pop_df.columns if pd.api.types.is_numeric_dtype(pop_df[col]) and pop_df[col].notna().sum() > 0]\n",
    "    data_associated_metrics = list(set(dataset_metric_dict[dataset_name])-demog_metrics-set(['Step goal','Exercise']))\n",
    "    # print(data_associated_metrics)\n",
    "    rel_pop_all, sample_size_pop_all, _, numeric_metrics = get_relationship_matrix(relationship_dict[dataset_name], rel_type = hyperparameter['rel_type'], data_type = 'pop')\n",
    "    user_ids = QA_df_with_queries[QA_df_with_queries['dataset'] == dataset_name]['user_id'].unique()\n",
    "    user_ids = user_ids\n",
    "    for user_id in tqdm(user_ids, desc=f\"Processing users for {dataset_name}\"):\n",
    "        par_df_original = pop_df[pop_df['participant_id'] == user_id]\n",
    "        par_df = par_df_original.copy()\n",
    "        rel_ind_all, sample_size_ind_all, _, numeric_metrics = get_relationship_matrix(relationship_dict[dataset_name]['users'][user_id], rel_type = hyperparameter['rel_type'], data_type = 'ind')\n",
    "        \n",
    "        rel_info = {'rel_pop_all': rel_pop_all, \n",
    "                'rel_var_pop_all': None, \n",
    "                'rel_pop_sample_size_all': sample_size_pop_all, \n",
    "                'rel_ind_all': rel_ind_all,\n",
    "                'rel_var_ind_all': None,\n",
    "                'rel_ind_sample_size_all': sample_size_ind_all,\n",
    "                'numeric_metrics': numeric_metrics,\n",
    "                'data_associated_metrics': data_associated_metrics,\n",
    "                }\n",
    "        \n",
    "        queries_per_user = QA_df_with_queries[QA_df_with_queries['user_id'] == user_id]\n",
    "        # queries_per_user = queries_per_user[queries_per_user['recent_abnormality'].isin(['low','medium','high'])]\n",
    "        # print('len_query', len(queries_per_user))\n",
    "    \n",
    "        # Initialize clients for different methods\n",
    "        chat_model = \"deepseek\"\n",
    "        clients = {}\n",
    "\n",
    "        clients['Base'] = Base(\n",
    "            chat_client=chat_model,\n",
    "            param=None\n",
    "        )\n",
    "\n",
    "        clients['Rag'] = Rag(\n",
    "            chat_client=chat_model,\n",
    "            param=None\n",
    "        )\n",
    "\n",
    "        clients['Wag'] = Wag(\n",
    "            chat_client=chat_model,\n",
    "            param=parm_final\n",
    "        )\n",
    "      \n",
    "        def process_query_row(row, clients, par_df, dataset_name, rel_info):\n",
    "            \"\"\"Process a single query row and return results for all methods\"\"\"\n",
    "            question = row['query']\n",
    "            # print(question)\n",
    "            \n",
    "            query_info = {\n",
    "                'query_date': row['query_date'],\n",
    "                'time_granularity': row['time_granularity'], \n",
    "                'openness': row['openness(assigned)']\n",
    "            }\n",
    "\n",
    "            results = {}\n",
    "            for method_name, client in clients.items():\n",
    "                try:\n",
    "                    # print(method_name)\n",
    "                    results[method_name],_ = client.query_quick(\n",
    "                        user_query=question,\n",
    "                        par_df=par_df.copy(),\n",
    "                        gt_nodes=row['associated_entity(gt)'],\n",
    "                        query_info=query_info,\n",
    "                        dataset_name=dataset_name,\n",
    "                        rel_info=rel_info,\n",
    "                        response_gen=True,\n",
    "                    )\n",
    "                except Exception as e:\n",
    "                    print(f\"Error processing {method_name}: {e}\")\n",
    "                    print(traceback.format_exc())\n",
    "                    results[method_name] = None\n",
    "            \n",
    "    \n",
    "            # # Collect related nodes for each method\n",
    "            # method_related_nodes = {}\n",
    "            # for method_name, result in results.items():\n",
    "            #     if result is None:\n",
    "            #         continue\n",
    "                    \n",
    "            #     related_nodes = set()\n",
    "                \n",
    "            #     for entity_dict in result['result_dict'].values():\n",
    "            #         for node, _, _, abnormality in entity_dict['related_nodes']:\n",
    "            #             related_nodes.add(node.name)\n",
    "            #             # print(node.name, abnormality)\n",
    "            #     method_related_nodes[method_name] = related_nodes\n",
    "            # # print(\"Method related nodes:\", method_related_nodes)\n",
    "            \n",
    "            # if method_related_nodes:  # Only check if we have results\n",
    "            #     # Check if all methods generate different results\n",
    "            #     all_different = True\n",
    "            #     for method1, nodes1 in method_related_nodes.items():\n",
    "            #         for method2, nodes2 in method_related_nodes.items():\n",
    "            #             if method1 != method2 and nodes1 == nodes2:\n",
    "            #                 all_different = False\n",
    "            #                 break\n",
    "            #         if not all_different:\n",
    "            #             break\n",
    "                        \n",
    "    \n",
    "            return results\n",
    "\n",
    "\n",
    "        def process_method_results(results, row, dataset_name, user_id):\n",
    "            \"\"\"Process results from all methods and return DataFrame rows\"\"\"\n",
    "\n",
    "            rows = []\n",
    "            q_dict = {\n",
    "                'q_id': row['q_id'],\n",
    "                'dataset': dataset_name,\n",
    "                'user_id': user_id, \n",
    "                'query': row['query'],\n",
    "                'query_date': row['query_date'],\n",
    "                'time_granularity': row['time_granularity'],\n",
    "                'openness(assigned)': row['openness(assigned)'],\n",
    "                'result': {}\n",
    "            }\n",
    "            for method_name, result in results.items():\n",
    "                if result is None:\n",
    "                    continue\n",
    "                    \n",
    "                primary_nodes = []\n",
    "                related_nodes = set()\n",
    "                \n",
    "                for entity in result['result_dict']:\n",
    "                    primary_nodes.append(result['result_dict'][entity]['primary_node'][0].name)\n",
    "                    for node, edge, weight, abnormality in result['result_dict'][entity]['related_nodes']:\n",
    "                        related_nodes.add(node.name)\n",
    "                data = convert_to_serializable(result.get('data', {}))\n",
    "                new_row = {\n",
    "                    'q_id': row['q_id'],\n",
    "                    'dataset': dataset_name,\n",
    "                    'user_id': user_id, \n",
    "                    'query': row['query'],\n",
    "                    'query_date': row['query_date'],\n",
    "                    'time_granularity': row['time_granularity'],\n",
    "                    'openness(assigned)': row['openness(assigned)'],\n",
    "                    'associated_entity(gt)': row['associated_entity(gt)'],\n",
    "                    'method': method_name,\n",
    "                    'primary_nodes': primary_nodes,\n",
    "                    'related_nodes': list(related_nodes),\n",
    "                    'context': result.get('context', ''),\n",
    "                    'response': result.get('response', ''),\n",
    "                    'data': data,\n",
    "                }\n",
    "   \n",
    "                q_dict['result'][method_name] = {\n",
    "                    # 'result_dict': result.get('result_dict', {}),\n",
    "                    'primary_nodes': primary_nodes,\n",
    "                    'related_nodes': list(related_nodes),\n",
    "                    'context': result.get('context', ''),\n",
    "                    'response': result.get('response', ''),\n",
    "                    'data': data\n",
    "                }\n",
    "                \n",
    "                rows.append(new_row)\n",
    "   \n",
    "            return q_dict, rows\n",
    "\n",
    "        # Process queries in parallel batches\n",
    "        \n",
    "\n",
    "        def process_single_row(row, clients, par_df, dataset_name, rel_info, user_id):\n",
    "            try:\n",
    "                results = process_query_row(row, clients, par_df, dataset_name, rel_info)\n",
    "                return process_method_results(results, row, dataset_name, user_id)\n",
    "            except Exception as e:\n",
    "                print(f\"Error processing row: {e}\")\n",
    "                return []\n",
    "\n",
    "        result_dict = {}\n",
    "        with ThreadPoolExecutor(max_workers=10) as executor:\n",
    "            future_to_row = {\n",
    "                executor.submit(process_single_row, row, clients, par_df, dataset_name, rel_info, user_id): row \n",
    "                for _, row in queries_per_user.iterrows()\n",
    "            }\n",
    "\n",
    "            for future in tqdm(as_completed(future_to_row), total=len(future_to_row), desc=\"Processing queries\"):\n",
    "                try:\n",
    "                    q_dict, new_rows = future.result()\n",
    "                    result_dict[q_dict['q_id']] = q_dict\n",
    "                    # print(q_dict)\n",
    "                    # for d in q_dict:\n",
    "                    #     result_dict[d['q_id']] = d\n",
    "\n",
    "                    for row in new_rows:\n",
    "                        # Convert row to DataFrame and ensure all columns exist\n",
    "                        row_df = pd.DataFrame([row])\n",
    "                        # Ensure row_df has same columns as results_df\n",
    "                        for col in results_df.columns:\n",
    "                            if col not in row_df.columns:\n",
    "                                row_df[col] = pd.NA\n",
    "                        results_df = pd.concat([results_df, row_df], ignore_index=True)\n",
    "                except Exception as e:\n",
    "                    print(f\"Error processing results: {e}\")\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "\n",
    "results_df_short = results_df\n",
    "results_df_short['related_nodes_tuple'] = results_df_short['related_nodes'].apply(\n",
    "    lambda x: tuple(sorted(x))\n",
    ")\n",
    "results_df_short = results_df_short[\n",
    "    results_df.groupby('q_id')['related_nodes_tuple'].transform('nunique') ==\n",
    "    results_df.groupby('q_id')['related_nodes_tuple'].transform('count')\n",
    "]\n",
    "grouped_df = results_df_short.groupby('q_id')\n",
    "print(len(grouped_df))\n",
    "\n",
    "q_ids = list(grouped_df.groups.keys())\n",
    "# with open(f'{root_dir}/experiment_result/local/query_ids_w_diff_res.json', 'w') as f:\n",
    "#     json.dump(q_ids, f)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# with open(f\"{root_dir}/experiment_result/general/results_df_no_response.json\", 'r') as f:\n",
    "#     results_df = json.load(f)\n",
    "\n",
    "# Group by q_id\n",
    "grouped_df = results_df.groupby('q_id')\n",
    "\n",
    "# Remove rows where response is missing\n",
    "# results_df = results_df.dropna(subset=['response'])\n",
    "\n",
    "\n",
    "# Convert DataFrame to dictionary\n",
    "result_dict = {}\n",
    "for q_id, group in grouped_df:\n",
    "    # print(group)\n",
    "    # print(group.to_dict('record')[0])\n",
    "    result_dict[q_id] = group.to_dict('records')\n",
    "\n",
    "\n",
    "# Convert to JSON-compatible format\n",
    "# result_dict = json.loads(json.dumps(result_dict))\n",
    "result_dict = clean_for_json(result_dict)\n",
    "with open(f'{root_dir}/experiment_result/general/test_result_dict_10.json', 'w') as f:\n",
    "    json.dump(result_dict, f, indent=4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(result_dict)\n",
    "for q_id, q_dict in result_dict.items():\n",
    "    for method, data in q_dict['result'].items():\n",
    "        d1 = data['data']\n",
    "        break\n",
    "        # with open(f'{root_dir}/result_dict_{q_id}_{method}.json', 'w') as f:\n",
    "        #     json.dump(data, f)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": ".venv",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.13.1"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
