{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 162,
   "id": "03ccece4",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "[nltk_data] Downloading package stopwords to /root/nltk_data...\n",
      "[nltk_data]   Package stopwords is already up-to-date!\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 162,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import os\n",
    "import fitz\n",
    "import sys\n",
    "import re\n",
    "import json\n",
    "from datetime import datetime\n",
    "from typing import Optional, List, Callable, Any, Tuple, Dict\n",
    "from abc import abstractmethod, ABC\n",
    "import random\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import copy\n",
    "import nltk\n",
    "from nltk.corpus import stopwords\n",
    "import pickle\n",
    "import itertools\n",
    "from dataclasses import dataclass, asdict\n",
    "from tqdm import tqdm\n",
    "from enum import Enum\n",
    "from dotenv import load_dotenv\n",
    "\n",
    "sys.path.append(\"../\")\n",
    "\n",
    "load_dotenv(dotenv_path=\"../.env\")\n",
    "nltk.download('stopwords')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 163,
   "id": "ce7b2c0a",
   "metadata": {},
   "outputs": [],
   "source": [
    "from utils import file_handle, grouping\n",
    "from utils.tree import Node"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 164,
   "id": "33db05dd",
   "metadata": {},
   "outputs": [],
   "source": [
    "from dataset_utils.reader import ADIQDataset\n",
    "from dataset_utils.question import Question\n",
    "\n",
    "\n",
    "ds = ADIQDataset(\"../dataset/datasets/simpleV3.1\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 165,
   "id": "dd5da751",
   "metadata": {},
   "outputs": [],
   "source": [
    "rule_information = file_handle.load_pickle(\n",
    "    os.path.join(\"../dataset/test_datasets/TEST_TreeStruct.pkl\")\n",
    ")\n",
    "\n",
    "asset_descriptions = ds.asset_descriptions"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "fd9cf727",
   "metadata": {},
   "source": [
    "# Observation stats "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 166,
   "id": "c5d1811c",
   "metadata": {},
   "outputs": [],
   "source": [
    "total_obs = list()\n",
    "unq_obs = set()\n",
    "for d in rule_information[\"rule_set\"]:\n",
    "    unq_obs = unq_obs.union(set(d[\"display_text\"][\"observations\"]))\n",
    "    total_obs.extend(d[\"display_text\"][\"observations\"])\n",
    "\n",
    "len(total_obs), len(unq_obs)\n",
    "\n",
    "unq_obs = list(unq_obs)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 167,
   "id": "18c039c2",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 : Boiler tube fouling\n",
      "1 : Economizer fouling\n",
      "2 : Condenser water high temperature\n",
      "3 : Chiller refrigerant leak\n",
      "4 : Flow meter calibration\n",
      "5 : Blowdown valve failure\n",
      "6 : Outside air temperature sensor failure\n",
      "7 : Cooling tower reset in manual\n",
      "8 : Condenser water low flow\n",
      "9 : Increased load on PDU\n",
      "10 : Temperature sensor calibration\n",
      "11 : Too few chillers running\n",
      "12 : Excessive load\n",
      "13 : Dryer not functioning\n",
      "14 : Fuel supply valve issue\n",
      "15 : Too many pumps running\n",
      "16 : Make up water valve issue\n",
      "17 : Chilled water valve failure\n",
      "18 : Power Meter Current Transformer issue\n",
      "19 : System leak\n",
      "20 : Conductivity meter issue causing excessive blowdown\n",
      "21 : Chilled water valve maunal override\n",
      "22 : Pressure sensor calibration\n",
      "23 : Air to air heat exhanger clogged/dirty\n",
      "24 : Too few pumps running\n",
      "25 : Chilled water high return temp\n",
      "26 : Chilled water flow meter calibration\n",
      "27 : Level sensor issue\n",
      "28 : VFD speed control in manual\n",
      "29 : Chilled water high flow\n",
      "30 : Water to aire heat exhanger fouled\n",
      "31 : Too few cooling towers running\n",
      "32 : Fuel filter clogged\n",
      "33 : VFD communications issue\n",
      "34 : Water to air heat exchanger low water flow\n",
      "35 : Fuel supply issue\n",
      "36 : Makeup water level issue\n",
      "37 : Too many cnodenser pumps running\n",
      "38 : Condenser pumps in manual\n"
     ]
    }
   ],
   "source": [
    "for i, unq in enumerate(unq_obs):\n",
    "    print(\"{} : {}\".format(i,unq))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 168,
   "id": "647b83fe",
   "metadata": {},
   "outputs": [],
   "source": [
    "from sentence_transformers import SentenceTransformer\n",
    "\n",
    "# 1. Load a pretrained Sentence Transformer model\n",
    "model = SentenceTransformer(\"all-MiniLM-L6-v2\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 169,
   "id": "87c78365",
   "metadata": {},
   "outputs": [],
   "source": [
    "enc = model.encode(unq_obs)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 170,
   "id": "c609468a",
   "metadata": {},
   "outputs": [],
   "source": [
    "norm = np.linalg.norm(enc, axis=1)\n",
    "norm = np.outer(norm,norm) + 1e-6"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 171,
   "id": "b5f886a4",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0.99999917\n"
     ]
    }
   ],
   "source": [
    "_thresh = 0.992\n",
    "cosine_sim = (enc @ enc.T)/norm\n",
    "cosine_sim = np.abs(cosine_sim)\n",
    "\n",
    "thresh = np.quantile(cosine_sim.flatten(),_thresh)\n",
    "print(thresh)\n",
    "for i in range(cosine_sim.shape[0]):\n",
    "    for j in range(i, cosine_sim.shape[0]):\n",
    "        cosine_sim[i,j] = 0\n",
    "\n",
    "ind = np.where(cosine_sim>thresh)\n",
    "\n",
    "observation_map = {}\n",
    "\n",
    "edges = []\n",
    "for x,y in zip(ind[0], ind[1]):\n",
    "    edges.append((x,y))\n",
    "    \n",
    "res = grouping.getComponents(cosine_sim.shape[0], edges)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 172,
   "id": "c5fe8758",
   "metadata": {},
   "outputs": [],
   "source": [
    "obs_mapping = {}\n",
    "for r in res:\n",
    "    if len(r)>1:\n",
    "        major = np.argmax([len(unq_obs[x]) for x in r])\n",
    "        major = unq_obs[r[major]]\n",
    "        \n",
    "        for r0 in r:\n",
    "            obs_mapping[unq_obs[r0]] = major \n",
    "    else:\n",
    "        obs_mapping[unq_obs[r[0]]] = unq_obs[r[0]]"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "0237c89e",
   "metadata": {},
   "source": [
    "# Rule stats "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 173,
   "id": "10842de7",
   "metadata": {},
   "outputs": [],
   "source": [
    "rule_information = file_handle.load_json(\n",
    "    os.path.join(\"../dataset/test_datasets/TEST_rule_information.json\")\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 174,
   "id": "e374cc36",
   "metadata": {},
   "outputs": [],
   "source": [
    "total_rules = list()\n",
    "unq_rules = set()\n",
    "for d in rule_information[\"rule_set\"]: \n",
    "    s = (d[\"display_text\"][\"rules\"].replace(\"-\",\"\").replace(\"OR\", \"\").replace(\"(\", \"\").replace(\")\", \"\")).split(\"\\n\")\n",
    "    s = [x.strip() for x in s]\n",
    "    unq_rules = unq_rules.union(set(s))\n",
    "    total_rules.extend(s)\n",
    "\n",
    "unq_rules = list(unq_rules)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 175,
   "id": "1c893968",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(47, 38)"
      ]
     },
     "execution_count": 175,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "len(total_rules), len(unq_rules)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 176,
   "id": "26908fc6",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['Cooling Tower Running',\n",
       " \"Sum of Child Pumps' KW / Condenser Water Flow > xx\",\n",
       " 'Chilled water Supply temp  Chilled water supply temp setpoint  < 2 degF',\n",
       " 'Condenser Water Flow > 50 gallon/minute',\n",
       " 'ABSSteam Pressure  135 PSI > 15 PSIG IF Steam Pressure Setpoint NOT Reporting',\n",
       " 'VFD Speed % > 97%',\n",
       " 'Supply Temp Setpoint = Previous Hour Supply Air Temp Setpoint',\n",
       " 'Coolant Flow > 50 g/m',\n",
       " 'Power Input > 5 Standard Deviations from past 7 day average',\n",
       " 'Met for 3 Hours Checking Previous 3 Days Daily Average',\n",
       " 'Power Input > 0.1KW',\n",
       " 'Number of Chillers Running is > 1',\n",
       " 'Chiller Running',\n",
       " 'Chilled Water Supply Temp  Chilled Water Supply Temp Setpoint  > 4 degF',\n",
       " 'Hot Water Boiler Gallons/BTU efficiency > XXX',\n",
       " 'Boiler Running',\n",
       " 'Fire Rate > 20%',\n",
       " 'Chiller % Loaded> 97%',\n",
       " '55 degF < Outside Air Temp < 80 degF',\n",
       " 'ABSSteam Pressure  Steam Pressure Setpoint > 15 PSIG',\n",
       " 'Discharge Air Temperature > 75 degF',\n",
       " 'Met for 2 Hours',\n",
       " 'Air Compressor Running',\n",
       " 'Met for 6 hours',\n",
       " 'Chilled Water Supply Temp  Chilled Water Supply Temp Setpoint  < 2 degF',\n",
       " 'Chilled water Supply temp  Chilled water supply temp setpoint  > 4 degF',\n",
       " 'Run Status Plate and Frame Point = 0',\n",
       " 'Makeup Water Flag = 1 > 3 times a day',\n",
       " 'Steam Boiler lbs/BTU efficiency > XXX',\n",
       " 'Condensate Flow / Steam Flow > Previous Day Value * 1.25',\n",
       " 'Humidification System Mode AHU Point = 0 IF Reporting',\n",
       " 'Met for 4 Hours',\n",
       " 'Chiller NOT Running',\n",
       " \"Sum of Child Pumps' VFD * HP tag value / Condenser Water Flow > yy\",\n",
       " 'Supply Temp Setpoint = Previous Daily Average Supply Air Temp Setpoint',\n",
       " 'None',\n",
       " 'Makeup Water Flow > Previous Day * 1.25',\n",
       " 'VFD Speed % < 30%']"
      ]
     },
     "execution_count": 176,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "unq_rules"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 177,
   "id": "62a85d9b",
   "metadata": {},
   "outputs": [],
   "source": [
    "enc = model.encode(unq_rules)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 178,
   "id": "ac52ce72",
   "metadata": {},
   "outputs": [],
   "source": [
    "norm = np.linalg.norm(enc, axis=1)\n",
    "norm = np.outer(norm,norm) + 1e-6"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 179,
   "id": "fe8af469",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0.9999993\n"
     ]
    }
   ],
   "source": [
    "_thresh = 0.997\n",
    "cosine_sim = (enc @ enc.T)/norm\n",
    "cosine_sim = np.abs(cosine_sim)\n",
    "\n",
    "thresh = np.quantile(cosine_sim.flatten(),_thresh)\n",
    "print(thresh)\n",
    "for i in range(cosine_sim.shape[0]):\n",
    "    for j in range(i, cosine_sim.shape[0]):\n",
    "        cosine_sim[i,j] = 0\n",
    "\n",
    "ind = np.where(cosine_sim>thresh)\n",
    "\n",
    "edges = []\n",
    "for x,y in zip(ind[0], ind[1]):\n",
    "    edges.append((x,y))\n",
    "    \n",
    "res = grouping.getComponents(cosine_sim.shape[0], edges)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 180,
   "id": "7c877cda",
   "metadata": {},
   "outputs": [],
   "source": [
    "rules_mapping = {}\n",
    "for r in res:\n",
    "    if len(r)>1:\n",
    "        major = np.argmax([len(unq_rules[x]) for x in r])\n",
    "        major = unq_rules[r[major]]\n",
    "\n",
    "        print(\"Major: \\n{}\".format(major))\n",
    "        \n",
    "        for r0 in r:\n",
    "            print(unq_rules[r0])\n",
    "            rules_mapping[unq_rules[r0]] = major \n",
    "\n",
    "        print(\"\\n\")\n",
    "    else:\n",
    "        rules_mapping[unq_rules[r[0]]] = unq_rules[r[0]]"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "edf11b6b",
   "metadata": {},
   "source": [
    "# Rule Grouping with semantic understanding"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 181,
   "id": "f4e28c25",
   "metadata": {},
   "outputs": [],
   "source": [
    "from sentence_transformers import SentenceTransformer, util\n",
    "\n",
    "\n",
    "model = SentenceTransformer(\"all-mpnet-base-v2\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 182,
   "id": "97eddd7c",
   "metadata": {},
   "outputs": [],
   "source": [
    "rule_repr_dict:Dict[str,str] = {x[\"id\"]:x[\"display_text\"][\"rules\"] for x in rule_information[\"rule_set\"]}\n",
    "enc = model.encode(list(rule_repr_dict.values()))\n",
    "rule_index_map = {k:v for v,k in enumerate(rule_repr_dict.keys())}\n",
    "index_rule_map = {k:v for v,k in rule_index_map.items()}\n",
    "\n",
    "norm = np.linalg.norm(enc, axis=1)\n",
    "norm = np.outer(norm,norm) + 1e-6\n",
    "\n",
    "cosine_sim = (enc @ enc.T)/norm\n",
    "cosine_sim = np.abs(cosine_sim)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 183,
   "id": "020fa435",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAgMAAAGdCAYAAACPX3D5AAAAOnRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjEwLjMsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcvZiW1igAAAAlwSFlzAAAPYQAAD2EBqD+naQAAMdpJREFUeJzt3X1cVHXe//H3gDB4i5YJSCmaJZqGBsmFVnYlm1f2YHX3saVlabjSry5oVS5NyZTUcixXsxuLbjRb29Kurm6sDHPZ7MqNQkG7NW/StMsENQsM10Fnzu+PHsvuGRA8OnCGzuvZ4/vHnDNzznsIh898v9/zPS7DMAwBAADHCrM7AAAAsBfFAAAADkcxAACAw1EMAADgcBQDAAA4HMUAAAAORzEAAIDDUQwAAOBwFAMAADhcK7sD/MOJw7vtjmCyfMBsuyOYvBF2xO4IJsf8NXZHMHm6fcj8KkuSjlS2sTuCid9w2R3BZFt4a7sjmHzS6oTdEUzCFVr/v741jtkdoY5X9q5p0uMH829SROeeQTtWUwmtT1AAAEKB32d3gmbFMAEAAA5HzwAAAIEMv90JmhXFAAAAgfwUAwAAOJrhsJ4B5gwAAOBw9AwAABCIYQIAAByOYQIAAOAk9AwAABDIYYsOUQwAABCIYQIAAOAk9AwAABCIqwkadvjwYS1fvlzFxcUqLy+XJMXGxmrw4MG67bbbdN555wU9JAAAzYlFhxqwadMmXXzxxXr00UcVHR2tq666SldddZWio6P16KOPKjExUZs3b270OF6vV1VVVabm9XrP+E0AAIAzZ6ln4K677tINN9yggoICuVzm+20bhqE77rhDd911l4qLixs8jsfj0Zw5c0zb7p32B82+e5KVOAAANA2GCU7tk08+0YoVK+oUApLkcrk0ZcoUDRw4sNHj5OXlKTc317Qt7Oh+K1EAAGg6DhsmsFQMxMbGqqSkRImJifXuLykpUUxMTKPHcbvdcrvdpm0nag5biQIAQNNhnYFTmzp1qm6//XaVlpZq2LBhtX/4KyoqVFRUpGeeeUZ//OMfmyQoAABoGpaKgezsbHXu3FkPP/ywnnjiCfl8P1dO4eHhSk5O1ooVK3TjjTc2SVAAAJoNwwQNGz16tEaPHq0TJ07o8OGfu/Y7d+6siIiIoIcDAMAWTCA8PREREYqLiwtmFgAAYANWIAQAIBDDBAAAOJzDhgm4UREAAA5HzwAAAAEMg3UGAABwNofNGWCYAAAAh6NnAACAQA6bQEgxAABAIIcNE1AMAAAQyGE3KmLOAAAADhcyPQPLB8y2O4LJhK1z7Y5gcvPsbLsjmMxce67dEUy2/xBade3+iHC7I5jEnwitbzlLfd/YHcFkgivB7ggm5eGh1UXd29XO7gjNj2ECAAAczmETCEPr6xQAAGh29AwAABCIYQIAAByOYQIAAOAk9AwAABDIYT0DFAMAAARw2l0LGSYAAMDh6BkAACAQwwQAADgclxYCAOBwDusZYM4AAAAOR88AAACBGCYAAMDhGCYAAABOEvRi4Ntvv9WECRMafI7X61VVVZWpnXDYAg8AgBBm+IPXLFq6dKkSEhIUFRWl1NRUlZSUnPK5J06c0Ny5c3XhhRcqKipKSUlJKiwstHzOoBcDR44c0fPPP9/gczwej6Kjo02t8OgXwY4CAMCZ8fuD1yxYvXq1cnNzlZ+fr7KyMiUlJWn48OE6ePBgvc+/99579dRTT+mxxx7Tl19+qTvuuEO/+c1vtGXLFkvntTxnYM2aNQ3u3717d6PHyMvLU25urmnbn/r8P6tRAAD4RVm8eLGysrKUmZkpSSooKNDbb7+t5cuXa8aMGXWev3LlSs2cOVMjRoyQJN155536y1/+okWLFumFF1447fNaLgZGjRoll8slwzBO+RyXy9XgMdxut9xut2lbhCvcahQAAJpGECcQer1eeb1e07b6/g7W1NSotLRUeXl5tdvCwsKUnp6u4uLiUx47KirKtK1169bauHGjpYyWhwni4uL06quvyu/319vKysqsHhIAgNASxDkD9Q2NezyeOqc8fPiwfD6fYmJiTNtjYmJUXl5eb8zhw4dr8eLF2rlzp/x+v9avX69XX31VBw4csPR2LRcDycnJKi0tPeX+xnoNAABwkry8PFVWVprav377PxuPPPKILrroIiUmJioyMlI5OTnKzMxUWJi1P++WhwmmTZum6urqU+7v1auX3nvvPauHBQAgdARxmKC+IYH6dO7cWeHh4aqoqDBtr6ioUGxsbL2vOe+88/T666/r+PHj+v7779W1a1fNmDFDPXv2tJTRcs/AlVdeqf/4j/845f62bdtq6NChVg8LAEDosOHSwsjISCUnJ6uoqKh2m9/vV1FRkdLS0hp8bVRUlOLj43Xy5En9z//8j0aOHGnp7bICIQAAgWxagTA3N1fjx49XSkqKBg0apCVLlqi6urr26oJx48YpPj6+ds7Bxx9/rP3792vAgAHav3+/7rvvPvn9ft19992WzksxAABAiBg9erQOHTqk2bNnq7y8XAMGDFBhYWHtpMJ9+/aZ5gMcP35c9957r3bv3q127dppxIgRWrlypTp27GjpvBQDAAAEsvFGRTk5OcrJyal334YNG0yPhw4dqi+//PKsz0kxAABAIG5UBAAAnISeAQAAAjmsZ4BiAACAQA5bPI9hAgAAHI6eAQAAAjFMAACAw1EM2OONsCN2RzC5eXa23RFMouYutTuCyVdv/qfdEUx+pU52RzApDwut8cYTEaF1i/BPK/bYHcGkd6d4uyOYlLY+aXcEk/2+U9+PBr8MIVMMAAAQMmxcdMgOFAMAAARimAAAAIfj0kIAAOAk9AwAABCIYQIAABzOYcUAwwQAADgcPQMAAATi0kIAAJzN8HM1AQAAcBB6BgAACOSwCYQUAwAABHLYnAGGCQAAcDh6BgAACMQEwob9/e9/18aNG/Xll1/W2Xf8+HH96U9/CkowAABs4/cHr7UAloqBHTt2qE+fPrrqqqvUv39/DR06VAcOHKjdX1lZqczMzEaP4/V6VVVVZWo+w2c9PQAATYFi4NSmT5+ufv366eDBg9q+fbvat2+vIUOGaN++fZZO6vF4FB0dbWq7q3ZbOgYAAAgOS8XAhx9+KI/Ho86dO6tXr1568803NXz4cF155ZXavfv0/5jn5eWpsrLS1Hp26Gk5PAAATcIwgtdaAEvFwN///ne1avXPOYcul0tPPvmkMjIyNHToUO3YseO0juN2u9WhQwdTC3eFW0sOAEBTcdgwgaWrCRITE7V582b16dPHtP3xxx+XJP36178OXjIAANAsLPUM/OY3v9FLL71U777HH39cN910k4wW0iUCAMAp+Y3gtRbAUjGQl5entWvXnnL/E088IX8L6RIBAOCUDH/wWgvACoQAADgcKxACABCohXTvBwvFAAAAAQyHDXkzTAAAgMPRMwAAQCCGCQAAcLgWchVAsFAMAAAQyGE9A8wZAADA4egZAAAgkMOuJqAYAAAgkMOGCUKmGDjmr7E7gsnMtefaHcHkqzf/0+4IJm9vecLuCCaTUmbYHcEkWi67I5h8H2IDghHhIfPRI0n6oHVo5bnYiLA7gsmmmv12R0ATC61/AQAAhAKHXU0QYt8XAAAIATbetXDp0qVKSEhQVFSUUlNTVVJS0uDzlyxZot69e6t169a64IILNGXKFB0/ftzSOSkGAAAIEatXr1Zubq7y8/NVVlampKQkDR8+XAcPHqz3+S+++KJmzJih/Px8bdu2TcuWLdPq1at1zz33WDovxQAAAAEMvz9ozYrFixcrKytLmZmZ6tu3rwoKCtSmTRstX7683ud/+OGHGjJkiG6++WYlJCTo2muv1U033dRob0IgigEAAAIFcZjA6/WqqqrK1Lxeb51T1tTUqLS0VOnp6bXbwsLClJ6eruLi4npjDh48WKWlpbV//Hfv3q21a9dqxIgRlt4uxQAAAE3I4/EoOjra1DweT53nHT58WD6fTzExMabtMTExKi8vr/fYN998s+bOnasrrrhCERERuvDCC3X11VczTAAAwFkLYs9AXl6eKisrTS0vLy8oMTds2KD58+friSeeUFlZmV599VW9/fbbmjdvnqXjcGkhAACBgnhpodvtltvtbvR5nTt3Vnh4uCoqKkzbKyoqFBsbW+9rZs2apVtvvVUTJ06UJPXv31/V1dW6/fbbNXPmTIWFnd53fnoGAAAIZMOlhZGRkUpOTlZRUdE/Y/j9KioqUlpaWr2vOXbsWJ0/+OHh4ZIkwzj9c9MzAABAiMjNzdX48eOVkpKiQYMGacmSJaqurlZmZqYkady4cYqPj6+dc5CRkaHFixdr4MCBSk1N1a5duzRr1ixlZGTUFgWng2IAAIAAhk33Jhg9erQOHTqk2bNnq7y8XAMGDFBhYWHtpMJ9+/aZegLuvfdeuVwu3Xvvvdq/f7/OO+88ZWRk6IEHHrB0XooBAAAC2XijopycHOXk5NS7b8OGDabHrVq1Un5+vvLz88/qnMwZAADA4egZAAAgkMWVA1s6igEAAALZOExgB8vFwLZt2/TRRx8pLS1NiYmJ+uqrr/TII4/I6/Xqlltu0TXXXNPoMbxeb52lGP2GX2EuRi0AAGhulv76FhYWasCAAZo6daoGDhyowsJCXXXVVdq1a5f27t2ra6+9Vn/9618bPU59SzPuO/rNmb4HAACCy8ZbGNvBUjEwd+5cTZs2Td9//72ee+453XzzzcrKytL69etVVFSkadOmacGCBY0ep76lGbu1TzjT9wAAQFAZhhG01hJYKga++OIL3XbbbZKkG2+8UUePHtXvfve72v1jx47Vp59+2uhx3G63OnToYGoMEQAAYA/LcwZcLpekn2+rGBUVpejo6Np97du3V2VlZfDSAQBghxbSvR8slr6OJyQkaOfOnbWPi4uL1a1bt9rH+/btU1xcXPDSAQBgB4fNGbDUM3DnnXfK5/PVPu7Xr59p/zvvvHNaVxMAABDK7FqO2C6WioE77rijwf3z588/qzAAAKD5segQAACB6BkAAMDhnLUaMTcqAgDA6egZAAAgABMIAQBwOocVAwwTAADgcPQMAAAQyGETCCkGAAAI4LQ5AwwTAADgcPQMAAAQiGECezzdPmSiSJK2/xBanSa/Uie7I5hMSplhdwSTRzYvsDuCyck3nrA7gsnJ0i/sjmBy6atD7I5g0tM4ancEk+MnQuvzMNLdy+4Izc5pwwSh9RsHAEAocFjPQGh9/QUAAM2OngEAAAIYDusZoBgAACCQw4oBhgkAAHA4egYAAAjAMAEAAE7nsGKAYQIAAByOngEAAAIwTAAAgMNRDAAA4HBOKwaYMwAAgMPRMwAAQCDDZXeCZhWUYsAwDLlczvrBAQB+uRgmOANut1vbtm0LxqEAAEAzs9QzkJubW+92n8+nBQsW6Nxzz5UkLV68uMHjeL1eeb1e07Yav1+RYUxhAADYz/A7q7fbUjGwZMkSJSUlqWPHjqbthmFo27Ztatu27WkNF3g8Hs2ZM8e0LefcC3XXeb2sxAEAoEk4bZjAUjEwf/58Pf3001q0aJGuueaa2u0RERFasWKF+vbte1rHycvLq9PLsO/y31mJAgAAgsRSMTBjxgwNGzZMt9xyizIyMuTxeBQREWH5pG63W26327SNIQIAQKgwHHY1geW/wJdffrlKS0t16NAhpaSk6PPPP+dKAgDAL4rhD15rCc7o63i7du30/PPPKy8vT+np6fL5fMHOBQCAIy1dulQJCQmKiopSamqqSkpKTvncq6++Wi6Xq067/vrrLZ3zrNYZGDNmjK644gqVlpaqe/fuZ3MoAABChl1XE6xevVq5ubkqKChQamqqlixZouHDh2v79u3q0qVLnee/+uqrqqmpqX38/fffKykpSTfccIOl8571QP3555+vkSNHqm3btmd7KAAAQoJhBK9ZsXjxYmVlZSkzM1N9+/ZVQUGB2rRpo+XLl9f7/HPOOUexsbG1bf369WrTpo3lYoDliAEACBDMnoH61tapbyJ9TU2NSktLlZeXV7stLCxM6enpKi4uPq1zLVu2TGPGjLH8BZ0p/AAANCGPx6Po6GhT83g8dZ53+PBh+Xw+xcTEmLbHxMSovLy80fOUlJTo888/18SJEy1npGcAAIAAwewZqG9tncBegWBYtmyZ+vfvr0GDBll+LcUAAAABrI71N6S+IYH6dO7cWeHh4aqoqDBtr6ioUGxsbIOvra6u1qpVqzR37twzysgwAQAAISAyMlLJyckqKiqq3eb3+1VUVKS0tLQGX/vf//3f8nq9uuWWW87o3PQMAAAQwK5LC3NzczV+/HilpKRo0KBBWrJkiaqrq5WZmSlJGjdunOLj4+vMOVi2bJlGjRpVe8NAqygGAAAIYNdyxKNHj9ahQ4c0e/ZslZeXa8CAASosLKydVLhv3z6FBSzfv337dm3cuFHvvvvuGZ+XYgAAgBCSk5OjnJycevdt2LChzrbevXvLOMtJDhQDAAAEaCn3FAgWigEAAAL4HXbXwpApBo5UtrE7gsn+iHC7I5iUhwXxOpcgiFZo/UM5+cYTdkcwaTXyP+2OYNb9zMcSm8L3azbaHcHEe6K93RFM+kQctTuCyUs1e+2OUMd/2R3gFyZkigEAAEKFXRMI7UIxAABAALsuLbQLxQAAAAGCuQJhS8AKhAAAOBw9AwAABGCYAAAAh3PapYUMEwAA4HD0DAAAEIBLCwEAcDiuJgAAAI5CzwAAAAGcNoGQYgAAgABOmzPAMAEAAA5HzwAAAAGcNoHwrIqB6upqvfzyy9q1a5fi4uJ000036dxzz230dV6vV16v17StxvAp0hVatw0GADiT0+YMWBom6Nu3r44cOSJJ+vbbb9WvXz9NmTJF69evV35+vvr27as9e/Y0ehyPx6Po6GhT+9NPO87sHQAAEGSG4QpaawksFQNfffWVTp48KUnKy8tT165dtXfvXpWUlGjv3r269NJLNXPmzEaPk5eXp8rKSlMb1+7iM3sHAADgrJzxMEFxcbEKCgoUHR0tSWrXrp3mzJmjMWPGNPpat9stt9tt2sYQAQAgVDhtmMByMeBy/fwDOn78uOLi4kz74uPjdejQoeAkAwDAJg6bP2i9GBg2bJhatWqlqqoqbd++Xf369avdt3fv3tOaQAgAAEKHpWIgPz/f9Lhdu3amx2+++aauvPLKs08FAICNGCZoQGAxEGjhwoVnFQYAgFDQUq4CCBZWIAQAwOFYgRAAgAB+uwM0M4oBAAACGGKYAAAAOAg9AwAABPA7bKEBigEAAAL4HTZMQDEAAEAA5gwAAABHoWcAAIAAXFoIAIDDOW2YIGSKgVBbBzr+hM/uCCYnIkLrFs/fh9gA08nSL+yOYNb9XbsTmLQacK3dEUw6+T6wO4LJcVdoff5EuU/aHcHEfTLC7ghoYiFTDAAAECoYJgAAwOGcVgyEWGcvAABobvQMAAAQgAmEAAA4nN9ZtQDDBAAAOB3FAAAAAfxyBa1ZtXTpUiUkJCgqKkqpqakqKSlp8Pk//vijsrOzFRcXJ7fbrYsvvlhr1661dE6GCQAACGDXTQtXr16t3NxcFRQUKDU1VUuWLNHw4cO1fft2denSpc7za2pq9Ktf/UpdunTRK6+8ovj4eO3du1cdO3a0dF6KAQAAAth1aeHixYuVlZWlzMxMSVJBQYHefvttLV++XDNmzKjz/OXLl+vIkSP68MMPFRHx8+JQCQkJls/LMAEAAE3I6/WqqqrK1Lxeb53n1dTUqLS0VOnp6bXbwsLClJ6eruLi4nqPvWbNGqWlpSk7O1sxMTHq16+f5s+fL5/P2iq6FAMAAATwu1xBax6PR9HR0abm8XjqnPPw4cPy+XyKiYkxbY+JiVF5eXm9OXfv3q1XXnlFPp9Pa9eu1axZs7Ro0SLdf//9lt4vwwQAAAQI5pyBvLw85ebmmra53e6gHNvv96tLly56+umnFR4eruTkZO3fv18LFy5Ufn7+aR+HYgAAgCbkdrtP649/586dFR4eroqKCtP2iooKxcbG1vuauLg4RUREKDz8nzez69Onj8rLy1VTU6PIyMjTysgwAQAAAfxBbKcrMjJSycnJKioq+mcOv19FRUVKS0ur9zVDhgzRrl275Pf/80w7duxQXFzcaRcCEsUAAAB1+F3Ba1bk5ubqmWee0fPPP69t27bpzjvvVHV1de3VBePGjVNeXl7t8++8804dOXJEkyZN0o4dO/T2229r/vz5ys7OtnReS8MEZWVl6tSpk3r06CFJWrlypQoKCrRv3z51795dOTk5GjNmTKPH8Xq9dWZS1hg+RbrCT/EKAAB++UaPHq1Dhw5p9uzZKi8v14ABA1RYWFg7qXDfvn0KC/vn9/gLLrhA69at05QpU3TppZcqPj5ekyZN0vTp0y2d11IxkJmZqUWLFqlHjx569tln9Yc//EFZWVm69dZbtX37dmVlZenYsWOaMGFCg8fxeDyaM2eOaduEton6ffu+lsIDANAUzmTlwGDJyclRTk5Ovfs2bNhQZ1taWpo++uijszqnpWJg586duuiiiyRJTzzxhB555BFlZWXV7r/88sv1wAMPNFoM1DezsuzicVaiAADQZOxagdAuloqBNm3a6PDhw+revbv279+vQYMGmfanpqZqz549jR6nvpmVDBEAAGAPSxMIr7vuOj355JOSpKFDh+qVV14x7X/55ZfVq1ev4KUDAMAGdk0gtIulnoEHH3xQQ4YM0dChQ5WSkqJFixZpw4YN6tOnj7Zv366PPvpIr732WlNlBQCgWdh1bwK7WOoZ6Nq1q7Zs2aK0tDQVFhbKMAyVlJTo3Xff1fnnn6+//e1vGjFiRFNlBQCgWRhBbC2B5RUIO3bsqAULFmjBggVNkQcAADQzliMGACBASxnrDxaKAQAAAjBnAAAAOAo9AwAABHBazwDFAAAAAQyHzRlgmAAAAIejZwAAgAAMEwAA4HBOKwYYJgAAwOHoGQAAIEBLWUY4WEKmGNgW3truCCZLfd/YHcHk04rGbw3dnCLCQ+ZXR5J06atD7I5g8v2ajXZHMOnk+8DuCCYjP5tndwSThIsy7I5gcnFYV7sjmBzw/mB3hGbHCoQAADgccwYAAICj0DMAAEAAp/UMUAwAABDAaRMIGSYAAMDh6BkAACAAVxMAAOBwTpszwDABAAAOR88AAAABnDaBkGIAAIAAfoeVAwwTAADgcPQMAAAQwGkTCCkGAAAI4KxBAooBAADqcFrPgKU5A3fddZc++CC0boUKAADOjqViYOnSpbr66qt18cUX68EHH1R5efkZndTr9aqqqsrUThi+MzoWAADB5ncFr7UElq8mePfddzVixAj98Y9/VLdu3TRy5Ei99dZb8vtPv1PF4/EoOjra1NYe/cJqFAAAmoRfRtBaS2C5GOjfv7+WLFmi7777Ti+88IK8Xq9GjRqlCy64QDNnztSuXbsaPUZeXp4qKytNbUT7S87oDQAAgLNzxusMRERE6MYbb1RhYaF2796trKws/fnPf1bv3r0bfa3b7VaHDh1MLcIVfqZRAAAIKiOIrSUIyqJD3bp103333ac9e/aosLAwGIcEAMA2/iC2lsBSMdC9e3eFh5/6G7zL5dKvfvWrsw4FAACaj6V1Bvbs2dNUOQAACBktZeJfsLDoEAAAAZxVCnCjIgAAHI+eAQAAArSUiX/BQs8AAAAB7Fx0aOnSpUpISFBUVJRSU1NVUlJyyueuWLFCLpfL1KKioiyfk2IAAIAAdq0zsHr1auXm5io/P19lZWVKSkrS8OHDdfDgwVO+pkOHDjpw4EBt27t3r8WzUgwAABAyFi9erKysLGVmZqpv374qKChQmzZttHz58lO+xuVyKTY2trbFxMRYPi/FAAAAAYK56FB9N+fzer11zllTU6PS0lKlp6fXbgsLC1N6erqKi4tPmfWnn35S9+7ddcEFF2jkyJH64gvr9/qhGAAAIIARxP/quzmfx+Opc87Dhw/L5/PV+WYfExNzyrsE9+7dW8uXL9cbb7yhF154QX6/X4MHD9b//d//WXq/XE0AAEATysvLU25urmmb2+0OyrHT0tKUlpZW+3jw4MHq06ePnnrqKc2bN++0j0MxAABAgGBeWuh2u0/rj3/nzp0VHh6uiooK0/aKigrFxsae1rkiIiI0cODA07qD8L8KmWLgk1Yn7I5gMsGVYHcEk96d4u2OYPJB65D51ZEk9TSO2h3BxHuivd0RTI67XHZHMEm4KMPuCCbf7HzT7ggmeSkz7Y5gUh1ZY3eEZmfHcsSRkZFKTk5WUVGRRo0a9XMOv19FRUXKyck5rWP4fD599tlnGjFihKVzh9YnOgAADpabm6vx48crJSVFgwYN0pIlS1RdXa3MzExJ0rhx4xQfH18752Du3Ln6t3/7N/Xq1Us//vijFi5cqL1792rixImWzksxAABAALvuTTB69GgdOnRIs2fPVnl5uQYMGKDCwsLaSYX79u1TWNg/5/7/8MMPysrKUnl5uTp16qTk5GR9+OGH6tu3r6XzUgwAABDAzrsW5uTknHJYYMOGDabHDz/8sB5++OGzPieXFgIA4HD0DAAAEMBpNyqiGAAAIIBh4zCBHSgGAAAI4LSeAeYMAADgcPQMAAAQgGECAAAcjmECAADgKPQMAAAQwG8wTAAAgKM5qxRgmAAAAMejZwAAgAB23pvADpZ7Bh5//HGNGzdOq1atkiStXLlSffv2VWJiou655x6dPHmy0WN4vV5VVVWZms/wWU8PAEATMIL4X0tgqRi4//77dc899+jYsWOaMmWKHnzwQU2ZMkVjx47V+PHj9eyzz2revHmNHsfj8Sg6OtrUNlduO+M3AQAAzpylYYIVK1ZoxYoV+u1vf6tPPvlEycnJev755zV27FhJUmJiou6++27NmTOnwePk5eUpNzfXvK3/BIvRAQBoGk5bZ8BSMfDdd98pJSVFkpSUlKSwsDANGDCgdv9ll12m7777rtHjuN1uud1u07ZwV7iVKAAANBnmDDQgNjZWX375pSRp586d8vl8tY8l6YsvvlCXLl2CmxAAgGbmtDkDlnoGxo4dq3HjxmnkyJEqKirS3XffralTp+r777+Xy+XSAw88oN/97ndNlRUAADQBS8XAnDlz1Lp1axUXFysrK0szZsxQUlKS7r77bh07dkwZGRmnNYEQAIBQxpyBBoSFhemee+4xbRszZozGjBkT1FAAANjJcNhyxKxACACAw7ECIQAAAZx2NQHFAAAAAZw2Z4BhAgAAHI6eAQAAArSU9QGChWIAAIAATpszwDABAAAOR88AAAABnLbOAMUAAAABnHY1AcUAAAABmEBok3C57I5gUh4eWnVhaeuTdkcwudiIsDuCyfETIfOrLEnqE3HU7ggmUe4Q+/0J62p3BJO8lJl2RzDxbH7A7ggmywfMtjsCmlhofYICABACnHY1AcUAAAABnDaBkEsLAQBwOHoGAAAIwDABAAAO57SrCRgmAADA4egZAAAggN9hEwgpBgAACOCsUoBhAgAAHI+eAQAAAnA1AQAADue0YoBhAgAAAhiGEbRm1dKlS5WQkKCoqCilpqaqpKTktF63atUquVwujRo1yvI5KQYAAAgRq1evVm5urvLz81VWVqakpCQNHz5cBw8ebPB133zzjaZOnaorr7zyjM5LMQAAQAC/jKA1KxYvXqysrCxlZmaqb9++KigoUJs2bbR8+fJTvsbn82ns2LGaM2eOevbseUbv13IxcODAAc2ePVvXXHON+vTpo0suuUQZGRlatmyZfD7fGYUAACCUGEH8z+v1qqqqytS8Xm+dc9bU1Ki0tFTp6em128LCwpSenq7i4uJTZp07d666dOmi3//+92f8fi0VA5s3b1afPn20du1anThxQjt37lRycrLatm2rqVOn6qqrrtLRo43fx72+H8xJg0ICAPDL4/F4FB0dbWoej6fO8w4fPiyfz6eYmBjT9piYGJWXl9d77I0bN2rZsmV65plnziqjpWJg8uTJmjJlijZv3qwPPvhAK1as0I4dO7Rq1Srt3r1bx44d07333tvocer7wWyq3HbGbwIAgGAK5gTCvLw8VVZWmlpeXt5ZZzx69KhuvfVWPfPMM+rcufNZHctSMVBWVqZbb7219vHNN9+ssrIyVVRUqFOnTnrooYf0yiuvNHqc+n4wl0f3sZ4eAIAmEMw5A263Wx06dDA1t9td55ydO3dWeHi4KioqTNsrKioUGxtb5/lff/21vvnmG2VkZKhVq1Zq1aqV/vSnP2nNmjVq1aqVvv7669N+v5aKgS5duujAgQOmgCdPnlSHDh0kSRdddJGOHDnS6HHq+8G0coVbiQIAwC9KZGSkkpOTVVRUVLvN7/erqKhIaWlpdZ6fmJiozz77TFu3bq1tv/71r/Xv//7v2rp1qy644ILTPrelRYdGjRqlO+64QwsXLpTb7da8efM0dOhQtW7dWpK0fft2xcfHWzkkAAAh50zWBwiG3NxcjR8/XikpKRo0aJCWLFmi6upqZWZmSpLGjRun+Ph4eTweRUVFqV+/fqbXd+zYUZLqbG+MpWLg/vvv14EDB5SRkSGfz6e0tDS98MILtftdLle9kyIAAGhJ7FqBcPTo0Tp06JBmz56t8vJyDRgwQIWFhbWTCvft26ewsOCvCmCpGGjXrp1Wr16t48eP6+TJk2rXrp1p/7XXXhvUcAAAOE1OTo5ycnLq3bdhw4YGX7tixYozOucZ3ZsgKirqjE4GAEBLYDjs3gTcqAgAgAB+m+YM2IViAACAAE7rGeDeBAAAOBw9AwAABGCYAAAAh2OYAAAAOAo9AwAABGCYAAAAh2OYAAAAOAo9AwAABGCYwCbfGsfsjmDS29Wu8Sc1o/2+arsjmGyq2W93BJNIdy+7I5i8VLPX7ggm7pMRdkcwOeD9we4IJtWRNXZHMFk+YLbdEUwmbJ1rd4RmxzABAABwlJDpGQAAIFQYht/uCM2KYgAAgAB+hw0TUAwAABDAcNgEQuYMAADgcPQMAAAQgGECAAAcjmECAADgKPQMAAAQgBUIAQBwOFYgBAAAjnJGPQM1NTV6/fXXVVxcrPLycklSbGysBg8erJEjRyoyMjKoIQEAaE5MIGzErl271KdPH40fP15btmyR3++X3+/Xli1bNG7cOF1yySXatWtXU2QFAKBZ+GUErbUElnsG7rzzTvXv319btmxRhw4dTPuqqqo0btw4ZWdna926dUELCQAAmo7lYuBvf/ubSkpK6hQCktShQwfNmzdPqampDR7D6/XK6/WatvkMn8Jd4VbjAAAQdAwTNKJjx4765ptvTrn/m2++UceOHRs8hsfjUXR0tKltr2RoAQAQGvyGEbTWElguBiZOnKhx48bp4Ycf1qeffqqKigpVVFTo008/1cMPP6zbbrtNt99+e4PHyMvLU2Vlpan1ju51xm8CAIBgMgwjaK0lsDxMMHfuXLVt21YLFy7Uf/3Xf8nlckn6+QcXGxur6dOn6+67727wGG63W26327SNIQIAAOxxRpcWTp8+XdOnT9eePXtMlxb26NEjqOEAALBDS7kKIFjOagXCHj161CkAvv32W+Xn52v58uVnFQwAALu0lO79YAn6CoRHjhzR888/H+zDAgCAJmK5Z2DNmjUN7t+9e/cZhwEAIBS0lKsAgsVyMTBq1Ci5XK4Gu1D+MakQAICWiBsVNSIuLk6vvvpq7TLEga2srKwpcgIAgCZiuRhITk5WaWnpKfc31msAAECoc9qiQ5aHCaZNm6bq6upT7u/Vq5fee++9swoFAICdnPal1nIxcOWVVza4v23btho6dOgZBwIAAM3rrNYZAADgl8hpEwgpBgAACMAwAQAADue0YiDoKxACAICWhZ4BAAACOKtfQJLxC3L8+HEjPz/fOH78uN1RDMMgT2PI0zDyNIw8DSMPrHAZxi9nYKSqqkrR0dGqrKxUhw4d7I5DHvKQhzzkCdE8MGPOAAAADkcxAACAw1EMAADgcL+oYsDtdis/P19ut9vuKJLI0xjyNIw8DSNPw8gDK35REwgBAIB1v6ieAQAAYB3FAAAADkcxAACAw1EMAADgcL+YYmDp0qVKSEhQVFSUUlNTVVJSYluW//3f/1VGRoa6du0ql8ul119/3bYskuTxeHT55Zerffv26tKli0aNGqXt27fblufJJ5/UpZdeqg4dOqhDhw5KS0vTO++8Y1uef7VgwQK5XC5NnjzZtgz33XefXC6XqSUmJtqWR5L279+vW265Reeee65at26t/v37a/PmzbZkSUhIqPPzcblcys7OtiWPz+fTrFmz1KNHD7Vu3VoXXnih5s2bZ+td744eParJkyere/fuat26tQYPHqxNmzY1y7kb+/wzDEOzZ89WXFycWrdurfT0dO3cubNZsuHUfhHFwOrVq5Wbm6v8/HyVlZUpKSlJw4cP18GDB23JU11draSkJC1dutSW8wd6//33lZ2drY8++kjr16/XiRMndO2116q6utqWPOeff74WLFig0tJSbd68Wddcc41GjhypL774wpY8/7Bp0yY99dRTuvTSS23NIUmXXHKJDhw4UNs2btxoW5YffvhBQ4YMUUREhN555x19+eWXWrRokTp16mRLnk2bNpl+NuvXr5ck3XDDDbbkefDBB/Xkk0/q8ccf17Zt2/Tggw/qoYce0mOPPWZLHkmaOHGi1q9fr5UrV+qzzz7Ttddeq/T0dO3fv7/Jz93Y599DDz2kRx99VAUFBfr444/Vtm1bDR8+XMePH2/ybGiAnTdGCJZBgwYZ2dnZtY99Pp/RtWtXw+Px2JjqZ5KM1157ze4YJgcPHjQkGe+//77dUWp16tTJePbZZ207/9GjR42LLrrIWL9+vTF06FBj0qRJtmXJz883kpKSbDt/oOnTpxtXXHGF3TFOadKkScaFF15o+P1+W85//fXXGxMmTDBt++1vf2uMHTvWljzHjh0zwsPDjbfeesu0/bLLLjNmzpzZrFkCP//8fr8RGxtrLFy4sHbbjz/+aLjdbuOll15q1mwwa/E9AzU1NSotLVV6enrttrCwMKWnp6u4uNjGZKGrsrJSknTOOefYnOTnLtZVq1apurpaaWlptuXIzs7W9ddfb/o9stPOnTvVtWtX9ezZU2PHjtW+fftsy7JmzRqlpKTohhtuUJcuXTRw4EA988wztuX5VzU1NXrhhRc0YcIEuVwuWzIMHjxYRUVF2rFjhyTpk08+0caNG3XdddfZkufkyZPy+XyKiooybW/durWtPUyStGfPHpWXl5v+nUVHRys1NZXPa5u1sjvA2Tp8+LB8Pp9iYmJM22NiYvTVV1/ZlCp0+f1+TZ48WUOGDFG/fv1sy/HZZ58pLS1Nx48fV7t27fTaa6+pb9++tmRZtWqVysrKmm1MtTGpqalasWKFevfurQMHDmjOnDm68sor9fnnn6t9+/bNnmf37t168sknlZubq3vuuUebNm3SH/7wB0VGRmr8+PHNnudfvf766/rxxx9122232ZZhxowZqqqqUmJiosLDw+Xz+fTAAw9o7NixtuRp37690tLSNG/ePPXp00cxMTF66aWXVFxcrF69etmS6R/Ky8slqd7P63/sgz1afDEAa7Kzs/X555/b/g2hd+/e2rp1qyorK/XKK69o/Pjxev/995u9IPj22281adIkrV+/vs43Kbv86zfKSy+9VKmpqerevbtefvll/f73v2/2PH6/XykpKZo/f74kaeDAgfr8889VUFBgezGwbNkyXXfdderatattGV5++WX9+c9/1osvvqhLLrlEW7du1eTJk9W1a1fbfj4rV67UhAkTFB8fr/DwcF122WW66aabVFpaaksehL4WP0zQuXNnhYeHq6KiwrS9oqJCsbGxNqUKTTk5OXrrrbf03nvv6fzzz7c1S2RkpHr16qXk5GR5PB4lJSXpkUceafYcpaWlOnjwoC677DK1atVKrVq10vvvv69HH31UrVq1ks/na/ZMgTp27KiLL75Yu3btsuX8cXFxdYq0Pn362Dp0IUl79+7VX/7yF02cONHWHNOmTdOMGTM0ZswY9e/fX7feequmTJkij8djW6YLL7xQ77//vn766Sd9++23Kikp0YkTJ9SzZ0/bMkmq/Uzm8zr0tPhiIDIyUsnJySoqKqrd5vf7VVRUZOsYdCgxDEM5OTl67bXX9Ne//lU9evSwO1Idfr9fXq+32c87bNgwffbZZ9q6dWttS0lJ0dixY7V161aFh4c3e6ZAP/30k77++mvFxcXZcv4hQ4bUuRR1x44d6t69uy15/uG5555Tly5ddP3119ua49ixYwoLM3+UhoeHy+/325Ton9q2bau4uDj98MMPWrdunUaOHGlrnh49eig2Ntb0eV1VVaWPP/6Yz2ub/SKGCXJzczV+/HilpKRo0KBBWrJkiaqrq5WZmWlLnp9++sn0LW7Pnj3aunWrzjnnHHXr1q3Z82RnZ+vFF1/UG2+8ofbt29eOzUVHR6t169bNnicvL0/XXXedunXrpqNHj+rFF1/Uhg0btG7dumbP0r59+zpzJ9q2batzzz3XtjkVU6dOVUZGhrp3767vvvtO+fn5Cg8P10033WRLnilTpmjw4MGaP3++brzxRpWUlOjpp5/W008/bUse6efi8bnnntP48ePVqpW9H2MZGRl64IEH1K1bN11yySXasmWLFi9erAkTJtiWad26dTIMQ71799auXbs0bdo0JSYmNstnYmOff5MnT9b999+viy66SD169NCsWbPUtWtXjRo1qsmzoQF2X84QLI899pjRrVs3IzIy0hg0aJDx0Ucf2ZblvffeMyTVaePHj7clT31ZJBnPPfecLXkmTJhgdO/e3YiMjDTOO+88Y9iwYca7775rS5b62H1p4ejRo424uDgjMjLSiI+PN0aPHm3s2rXLtjyGYRhvvvmm0a9fP8PtdhuJiYnG008/bWuedevWGZKM7du325rDMAyjqqrKmDRpktGtWzcjKirK6NmzpzFz5kzD6/Xalmn16tVGz549jcjISCM2NtbIzs42fvzxx2Y5d2Off36/35g1a5YRExNjuN1uY9iwYSHx/9HpuIUxAAAO1+LnDAAAgLNDMQAAgMNRDAAA4HAUAwAAOBzFAAAADkcxAACAw1EMAADgcBQDAAA4HMUAAAAORzEAAIDDUQwAAOBwFAMAADjc/wcp4UwNCsibWQAAAABJRU5ErkJggg==",
      "text/plain": [
       "<Figure size 640x480 with 2 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "import seaborn as sns\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "sns.heatmap(cosine_sim)\n",
    "\n",
    "plt.savefig('RRSim_heatmap.png', dpi=600, bbox_inches='tight')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 184,
   "id": "9f47d1fc",
   "metadata": {},
   "outputs": [],
   "source": [
    "rule_codition_similarity = np.argsort(cosine_sim, axis=-1)\n",
    "\n",
    "rule_id_similarity_map = {}\n",
    "for k,v in rule_index_map.items():\n",
    "    rule_id_similarity_map[k] = [index_rule_map[x] for x in rule_codition_similarity[v]]"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "3aa49c3b",
   "metadata": {},
   "source": [
    "# Dataset Creation "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 185,
   "id": "0bf54815",
   "metadata": {},
   "outputs": [],
   "source": [
    "random.seed(420)\n",
    "np.random.seed(420)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 186,
   "id": "bc998796",
   "metadata": {},
   "outputs": [],
   "source": [
    "rule_information = file_handle.load_pickle(\n",
    "    os.path.join(\"../dataset/test_datasets/TEST_TreeStruct.pkl\")\n",
    ")\n",
    "\n",
    "asset_descriptions = ds.asset_descriptions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 187,
   "id": "e9f593bb",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<dataset.utils.tree.Node object at 0x7f53b6337f90>\n"
     ]
    }
   ],
   "source": [
    "for  x in rule_information[\"rule_set\"]:\n",
    "    if x[\"id\"] == \"TEST_RULE_CT00004\":\n",
    "        print(x[\"display_text\"][\"rules\"])"
   ]
  },
  {
   "cell_type": "raw",
   "id": "5d069246",
   "metadata": {},
   "source": [
    "question_id: <unique_id>  # e.g., WTWQ-001\n",
    "date_detected: <MM/DD/YYYY>\n",
    "asset_type: <Asset Type>  # e.g., AHU, Chiller, VAV\n",
    "condition_description: |\n",
    "  - <Condition 1>\n",
    "  - <Condition 2>\n",
    "  - <Condition 3>\n",
    "  - ...\n",
    "  - Condition met for <duration>\n",
    "question_prompt: |\n",
    "  Given the above detected condition, what should the operator look for?\n",
    "options:\n",
    "  - A) <Correct action>\n",
    "  - B) <Distractor 1>\n",
    "  - C) <Distractor 2>\n",
    "  - D) <Distractor 3>\n",
    "answer: A\n",
    "rationale: |\n",
    "  The condition suggests <explanation>. Therefore, the correct response is to <action>.\n",
    "tags:\n",
    "  - condition_type: <e.g., sensor-stuck, flow-imbalance>\n",
    "  - asset_zone: <e.g., VAV zone, hot deck, chilled loop>\n",
    "  - response_type: <e.g., investigate, recalibrate, replace, tune BMS logic>\n",
    "difficulty: <Entry-level | Intermediate | Advanced>"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 188,
   "id": "eab0676c",
   "metadata": {},
   "outputs": [],
   "source": [
    "from dataset_utils import creation, config\n",
    "\n",
    "\n",
    "dataset_config = config.DatasetCreationConfig({\n",
    "    \"num_options\":4,\n",
    "    \"question_template_mode\":config.QuestionTemplateMode.random,\n",
    "    \"sel_random_sample\": 2,\n",
    "    'elem_random_sample':2,\n",
    "    \"question_template_random_count\" : 1,\n",
    "    \"n_least_sim_rules\":2\n",
    "})"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 189,
   "id": "8765b170",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'subject': 'diagnosis_sense_simple_question_analysis',\n",
       " 'db_acronym': 'ADIQ',\n",
       " 'db_name': 'AssetDiagnosisIQ',\n",
       " 'option_choices_string': 'ABCDEFGHIJKLMNOPQRSTUVWXYZ',\n",
       " 'question_first': None,\n",
       " 'text_type': 'choice',\n",
       " 'relevancy': None,\n",
       " 'num_options': 4,\n",
       " 'question_template_mode': 'random',\n",
       " 'question_template_pre_select_options': [0],\n",
       " 'question_template_random_count': 1,\n",
       " 'sel_random_sample': 2,\n",
       " 'elem_random_sample': 2,\n",
       " 'n_least_sim_rules': 2,\n",
       " 'question_condition_template': '\\n## Asset Description:\\n{asset_type}: {asset_description}\\n\\n## Conditions:\\n{conditions}\\n\\n{question_prompt}\\n'}"
      ]
     },
     "execution_count": 189,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "dataset_config.to_config()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 190,
   "id": "86902eae",
   "metadata": {},
   "outputs": [],
   "source": [
    "dataset = creation.create_dataset(\n",
    "    rule_information,\n",
    "    obs_mapping,\n",
    "    asset_descriptions,\n",
    "    rule_id_similarity_map,\n",
    "    dataset_config\n",
    "    )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 191,
   "id": "076fc822",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "176"
      ]
     },
     "execution_count": 191,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "len(dataset[\"questions\"])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 192,
   "id": "4d12ecd4",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Overridding Dataset\n"
     ]
    }
   ],
   "source": [
    "creation.save_dataset(\n",
    "    dataset,\n",
    "    \"simpleTestV1\",\n",
    "    \"test_datasets/datasets\"\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 193,
   "id": "ed742837",
   "metadata": {},
   "outputs": [],
   "source": [
    "from dataset_utils.reader import ADIQDataset\n",
    "from dataset_utils.outputs import to_basic_prompt\n",
    "\n",
    "ds = ADIQDataset(\"test_datasets/datasets/simpleTestV1\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 194,
   "id": "b2eb100b",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "176"
      ]
     },
     "execution_count": 194,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "len(ds.questions)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 195,
   "id": "1595ef2b",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 176/176 [00:00<00:00, 11411.31it/s]\n"
     ]
    }
   ],
   "source": [
    "from collections import Counter\n",
    "\n",
    "for que1 in tqdm(ds.questions):\n",
    "    flag = True\n",
    "    dup_id = None\n",
    "    for que2 in ds.questions:\n",
    "        if que1.id == que2.id:\n",
    "            continue\n",
    "\n",
    "        if que1.asset_type == que2.asset_type:\n",
    "            if que1.condition_description == que2.condition_description:\n",
    "                if Counter(que1.options) == Counter(que2.options):\n",
    "                    print(que1, que2)\n",
    "                    flag = False\n",
    "                    dup_id = que2.id\n",
    "\n",
    "    if not flag:\n",
    "        print(que1.id, dup_id)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 196,
   "id": "3ae7edad",
   "metadata": {},
   "outputs": [],
   "source": [
    "question_template = \"\"\"\n",
    "## Asset Description:\n",
    "{asset_type}: {asset_description}\n",
    "\n",
    "## Conditions:\n",
    "{conditions}\n",
    "\n",
    "## How long the conditions were met:\n",
    "{temporal_condition}\n",
    "\n",
    "{question_prompt}\n",
    "{options}\n",
    "\"\"\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 197,
   "id": "ef5372cf",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "## Asset Description:\n",
      "Chiller: A device that removes heat from a liquid through a vapor-compression or vapor-absorption refrigeration process. The cooled liquid can then be used to cool equipment, buildings, or other systems.\n",
      "\n",
      "## Conditions:\n",
      "- Chiller Running\n",
      "- VFD Speed % > 97%\n",
      "- (Chilled Water Supply Temp - Chilled Water Supply Temp Setpoint ) < -2 degF\n",
      "\n",
      "## How long the conditions were met:\n",
      "Met for 4 Hours\n",
      "\n",
      "Given what is known about the asset’s conditions, which explanation makes the MOST sense?\n",
      "A). Too few pumps running\n",
      "B). System leak\n",
      "C). Power Meter Current Transformer issue\n",
      "D). Conductivity meter issue causing excessive blowdown\n",
      "\n"
     ]
    }
   ],
   "source": [
    "print(to_basic_prompt(ds.questions[100],question_template, ds.asset_descriptions))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 198,
   "id": "1a3aece2",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(5, [True, False, False, False])"
      ]
     },
     "execution_count": 198,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "ds.questions[100].rule_id, ds.questions[100].correct"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 199,
   "id": "78beb78f",
   "metadata": {},
   "outputs": [],
   "source": [
    "q_type_stats = {\"p\":0,\"n\":0}\n",
    "for q in ds.questions:\n",
    "    if q.question_type == \"positive\":\n",
    "        q_type_stats[\"p\"] += 1\n",
    "    else:\n",
    "        q_type_stats[\"n\"] += 1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 200,
   "id": "77b54638",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'p': 142, 'n': 34}"
      ]
     },
     "execution_count": 200,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "q_type_stats"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 201,
   "id": "1a205402",
   "metadata": {},
   "outputs": [],
   "source": [
    "opt_comp = {}\n",
    "for q in ds.questions:\n",
    "    try:\n",
    "        opt_comp[len(q.options)] += 1\n",
    "    except KeyError as er:\n",
    "        opt_comp[len(q.options)] = 1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 202,
   "id": "84eb84c7",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{4: 142, 3: 34}"
      ]
     },
     "execution_count": 202,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "opt_comp"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "28b72099",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
