{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "05566ac8",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "[nltk_data] Downloading package stopwords to /root/nltk_data...\n",
      "[nltk_data]   Package stopwords is already up-to-date!\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import os\n",
    "import fitz\n",
    "import re\n",
    "import json\n",
    "from datetime import datetime\n",
    "from typing import Optional, List, Callable, Any, Tuple, Dict, Set\n",
    "from abc import abstractmethod, ABC\n",
    "import random\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import copy\n",
    "import nltk\n",
    "from nltk.corpus import stopwords\n",
    "import pickle\n",
    "import itertools\n",
    "\n",
    "nltk.download('stopwords')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "87345fb7",
   "metadata": {},
   "outputs": [],
   "source": [
    "import utils.file_handle as file_handle\n",
    "import utils.tree as tree_func\n",
    "from utils.tree import Node"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "208078b2",
   "metadata": {},
   "outputs": [],
   "source": [
    "data = file_handle.load_pickle(\"extracted/TreeStruct.pkl\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "861b24ba",
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_num_leafNode(root:Node):\n",
    "    if not root.children:\n",
    "        if root.statement:\n",
    "            if \"Met\" in root.statement:\n",
    "                return 0\n",
    "            else:\n",
    "                return 1\n",
    "        else:\n",
    "            return 1\n",
    "    \n",
    "    num = 0\n",
    "    for c in root.children:\n",
    "        num += get_num_leafNode(c)\n",
    "\n",
    "    return num\n",
    "\n",
    "\n",
    "def get_num_conditionNode(root:Node):\n",
    "    if root.ops:\n",
    "        num = 1 if root.ops == \"OR\" else 0\n",
    "    else:\n",
    "        num = 0\n",
    "\n",
    "    for c in root.children:\n",
    "        num += get_num_conditionNode(c)\n",
    "\n",
    "    return num\n",
    "\n",
    "def get_num_allNode(root:Node):\n",
    "    if not root.children:\n",
    "        if root.statement:\n",
    "            if \"Met\" in root.statement:\n",
    "                return 0\n",
    "            else:\n",
    "                return 1\n",
    "        else:\n",
    "            return 0\n",
    "        \n",
    "    num = len(root.children) if root.children else 0\n",
    "    for c in root.children:\n",
    "        num += get_num_allNode(c)\n",
    "\n",
    "    return num\n",
    "\n",
    "def each_rule_stats(rule):\n",
    "    _data = {\n",
    "        \"asset_type\" : rule[\"asset\"]\n",
    "    }\n",
    "\n",
    "    _data[\"conditions\"] = {\n",
    "        \"leaf\":get_num_leafNode(rule[\"display_text\"][\"rules\"]),\n",
    "        \"conditional\":get_num_conditionNode(rule[\"display_text\"][\"rules\"]) - get_num_leafNode(rule[\"display_text\"][\"rules\"]) -1,\n",
    "        \"all\": get_num_allNode(rule[\"display_text\"][\"rules\"]) -1\n",
    "    }\n",
    "\n",
    "    _data[\"observations\"] = len(rule[\"display_text\"][\"observations\"])\n",
    "\n",
    "    return _data\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "c598dc54",
   "metadata": {},
   "outputs": [],
   "source": [
    "stats = []\n",
    "for rule in data[\"rule_set\"]:\n",
    "    resp = each_rule_stats(rule)\n",
    "    stats.append(resp)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "d4ad2c0d",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Meter 3 4 4 4\n",
      "Boiler 6 5 17 19\n",
      "AHU 55 54 312 172\n",
      "Fan 1 0 4 4\n",
      "HXU 4 0 12 9\n",
      "Chiller 11 0 26 27\n",
      "Air Compressor 3 1 6 8\n",
      "VAV 8 3 30 18\n",
      "UPS 1 1 2 1\n",
      "None 1 0 5 3\n",
      "PDU 3 0 7 3\n",
      "Pump 5 1 20 22\n",
      "AHU Humidity 1 0 3 1\n",
      "Lighting 1 1 2 2\n",
      "Plate & Frame 1 1 4 4\n",
      "PIU 2 1 5 5\n",
      "Cooling Tower 4 1 11 12\n",
      "CRAC 10 0 21 28\n"
     ]
    }
   ],
   "source": [
    "unq_asset_types = set([x['asset_type'] for x in stats])\n",
    "asst_type_map = {v:k for k,v in enumerate(unq_asset_types)}\n",
    "ind_asst_type_map = {k:v for v,k in asst_type_map.items()}\n",
    "\n",
    "asset_types = np.array([asst_type_map[x['asset_type']] for x in stats])\n",
    "_t,_c = np.unique(asset_types, return_counts=True)\n",
    "\n",
    "conditional_count = {}\n",
    "number_conditions = {}\n",
    "observation_count = {}\n",
    "\n",
    "for x in stats:\n",
    "    try:\n",
    "        conditional_count[x['asset_type']] += x['conditions'][\"conditional\"]\n",
    "    except KeyError as ke:\n",
    "        conditional_count[x['asset_type']] = x['conditions'][\"conditional\"]\n",
    "\n",
    "    try:\n",
    "        number_conditions[x['asset_type']] += x['conditions'][\"leaf\"]\n",
    "    except KeyError as ke:\n",
    "        number_conditions[x['asset_type']] = x['conditions'][\"leaf\"]\n",
    "    \n",
    "    try:\n",
    "        observation_count[x['asset_type']] += x['observations']\n",
    "    except KeyError as ke:\n",
    "        observation_count[x['asset_type']] = x['observations']\n",
    "\n",
    "\n",
    "\n",
    "for k,v in zip(_t,_c):\n",
    "    print(ind_asst_type_map[k],v, conditional_count[ind_asst_type_map[k]], number_conditions[ind_asst_type_map[k]], observation_count[ind_asst_type_map[k]])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5ebc4e9c",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
