{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "9d386407",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "[nltk_data] Downloading package stopwords to /root/nltk_data...\n",
      "[nltk_data]   Package stopwords is already up-to-date!\n"
     ]
    }
   ],
   "source": [
    "import os, sys\n",
    "import fitz\n",
    "import re\n",
    "import json\n",
    "from datetime import datetime\n",
    "from typing import Optional, List, Callable, Any, Tuple, Dict, Self, Union, TypedDict\n",
    "from abc import abstractmethod, ABC\n",
    "import random\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import copy\n",
    "import nltk\n",
    "from nltk.corpus import stopwords\n",
    "import pickle\n",
    "from tqdm.autonotebook import tqdm\n",
    "import itertools\n",
    "from dotenv import load_dotenv\n",
    "\n",
    "sys.path.append(\"../\")\n",
    "\n",
    "load_dotenv(dotenv_path=\"../.env\")\n",
    "nltk.download('stopwords')\n",
    "\n",
    "random.seed(42)\n",
    "np.random.seed(42)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "a4ec5e0b",
   "metadata": {},
   "outputs": [],
   "source": [
    "BENCH_TAG = \"basic_bench\"\n",
    "BENCH_ID = str(datetime.now().isoformat())\n",
    "SAVE_LOC = os.path.join(\"results\",BENCH_TAG, BENCH_ID)\n",
    "#os.makedirs(SAVE_LOC, exist_ok=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "1a17defe",
   "metadata": {},
   "outputs": [],
   "source": [
    "from dataset.dataset_utils.reader import ADIQDataset\n",
    "from dataset.dataset_utils.question import Question\n",
    "from dataset.utils import file_handle\n",
    "\n",
    "\n",
    "ds = ADIQDataset(\"../dataset/datasets/simplePertV3.1\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "98f4f248",
   "metadata": {},
   "outputs": [],
   "source": [
    "from sentence_transformers import SentenceTransformer, util\n",
    "from dataset.utils import file_handle\n",
    "\n",
    "\n",
    "emb_model = SentenceTransformer(\"all-mpnet-base-v2\")\n",
    "\n",
    "def get_db_data(loc = \"../dataset/extracted/taxonomy/concepts_reduced.json\"):\n",
    "    db = file_handle.load_json(loc)\n",
    "    list_keys = list(db.keys())\n",
    "    keys_map = {k:v for k,v in enumerate(list_keys)}\n",
    "\n",
    "    db_enc = emb_model.encode(list_keys)\n",
    "\n",
    "    return keys_map, db, db_enc\n",
    "\n",
    "DB_KEY_MAP, DB, DB_ENC = get_db_data()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "13c45e48",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "def get_search_terms(terms:List[str], n =5):\n",
    "    sen_enc = emb_model.encode(terms)\n",
    "    \n",
    "    sim = sen_enc@DB_ENC.T\n",
    "    norm = np.linalg.norm(sim, axis=0)\n",
    "    sim = np.divide(sim, norm+10-16)\n",
    "\n",
    "    sel_term = []\n",
    "    for i in range(len(terms)):\n",
    "        sim_row = sim[i]\n",
    "        max_arg = np.argsort(sim_row, axis=0)[::-1]\n",
    "        c = 0\n",
    "\n",
    "        for e in max_arg:\n",
    "            k = DB_KEY_MAP[e]\n",
    "            t = copy.deepcopy(DB[k])\n",
    "\n",
    "            if t[\"meaning\"]:\n",
    "                t['sim'] = sim_row[e]\n",
    "                sel_term.append(t)\n",
    "                c+=1\n",
    "\n",
    "            if c>= n:\n",
    "                break\n",
    "\n",
    "    \n",
    "    sel_term = sorted(sel_term, key=lambda x:x['sim'])\n",
    "    return sel_term\n",
    "    \n",
    "\n",
    "def format_search_terms(terms):\n",
    "    txt = \"\"\n",
    "    for t in terms:\n",
    "        txt += \"{} : {}\".format(\n",
    "            \",\".join(t[\"words\"]),\n",
    "            t[\"meaning\"]\n",
    "        )\n",
    "\n",
    "        txt += \"\\n\"\n",
    "    \n",
    "    return txt\n",
    "\n",
    "def get_helpful_words(asset, conditions = None, topk=5):\n",
    "    search_terms = [asset]\n",
    "    if conditions:\n",
    "        search_terms.extend(conditions)\n",
    "\n",
    "    search_terms = get_search_terms(search_terms)\n",
    "    search_terms = search_terms[:topk]\n",
    "    search_terms = format_search_terms(search_terms)\n",
    "\n",
    "\n",
    "    return search_terms\n",
    "    \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "id": "d2987050",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Supply Relative Humidity %,Humidity,Supply Relative Humidity Setpoint %,Relative Humidity : The ratio of the amount of water vapor present in air to the amount needed for saturation at the same temperature.\n",
      "Override,override : To interrupt the action of an automatic device or system, typically to take manual control.\n",
      "Check the command from the BMS : Verify the specific command issued by the BMS.\n",
      "Reset temperature to outside conditions,Reset temperature : Adjusting the setpoint temperature based on outside conditions to optimize energy efficiency.\n",
      "Zone Temperature OR Return Temperature less than 65 F / 18.3 C : The temperature in a specific area or the temperature of the air returning to the AHU is below 65°F or 18.3°C\n",
      "\n"
     ]
    }
   ],
   "source": [
    "q = ds.questions[0]\n",
    "print(get_helpful_words(q.asset_type, q.condition_description))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "94d5898d",
   "metadata": {},
   "outputs": [],
   "source": [
    "from bench_utils.question import MultipleChoiceQuestion\n",
    "from bench_utils.inference_calls import LLMConfiguration, ModelConfig, MODEL_MAP\n",
    "\n",
    "_template = \"\"\"\n",
    "## Asset Description:\n",
    "{asset_type}: {asset_desc}\n",
    "\n",
    "## Helpful words:\n",
    "{helpful_words}\n",
    "\n",
    "## Conditions:\n",
    "{condition_str}\n",
    "\n",
    "## How long the conditions were met:\n",
    "{temporal_condition}\n",
    "\n",
    "{question_prompt}\n",
    "\"\"\"\n",
    "\n",
    "\n",
    "\n",
    "def question_templating(q:Question, desc_dict:Dict[str,str]) -> str:\n",
    "    asset_type = q.asset_type\n",
    "    asset_desc = desc_dict.get(q.asset_type, \"NONE\")\n",
    "    condition_str = \"\\n\".join(list(map(lambda x:\"- \"+x, q.condition_description)))\n",
    "    temporal_condition = q.temporal_condition[0] if len(q.temporal_condition)>0 else \"None\"\n",
    "    question_prompt = q.question_prompt\n",
    "\n",
    "    helpful_words = get_helpful_words(q.asset_type, q.condition_description)\n",
    "\n",
    "    return _template.format(\n",
    "        asset_type = asset_type,\n",
    "        asset_desc = asset_desc,\n",
    "        condition_str = condition_str,\n",
    "        temporal_condition = temporal_condition,\n",
    "        question_prompt = question_prompt,\n",
    "        helpful_words = helpful_words\n",
    "        )\n",
    "\n",
    "\n",
    "models_to_test:List[ModelConfig] = [\n",
    "    ModelConfig(**{\n",
    "        \"name\":'mistral-large',\n",
    "        \"identifier\" : 'mistralai/mistral-large',\n",
    "    }),\n",
    "    #ModelConfig(**{\n",
    "    #    \"name\":'llama-3-3-70b-instruct',\n",
    "    #    \"identifier\" : 'llama-3-3-70b-instruct',\n",
    "    #}),\n",
    " #   ModelConfig(**{\n",
    " #       \"name\":'qwen2-5-72b-instruct',\n",
    " #       'identifier':'Qwen/Qwen2.5-72B-Instruct'\n",
    " #   }),\n",
    " #   ModelConfig(**{\n",
    " #       \"name\":\"llama-3-1-405b-instruct-fp8\",\n",
    " #       \"identifier\":\"llama-3-1-405b-instruct-fp8\"\n",
    " #   }),\n",
    " #   ModelConfig(**{\n",
    " #       \"name\":\"llama-3-1-8b-instruct\",\n",
    " #       \"identifier\":\"llama-3-1-8b-instruct\"\n",
    " #   }),\n",
    " #   ModelConfig(**{\n",
    " #       \"name\":\"microsoft-phi-4\",\n",
    " #       \"identifier\":\"microsoft-phi-4\"\n",
    " #   }),\n",
    " #   ModelConfig(**{\n",
    " #       \"name\":\"mixtral-8x22b-instruct-v01\",\n",
    " #       \"identifier\":\"mixtral-8x22b-instruct-v01\"\n",
    " #   })\n",
    "    #ModelConfig(**{\n",
    "    #    \"name\":'o1',\n",
    "    #    \"identifier\" : 'openai/o1',\n",
    "    #}),\n",
    "    #ModelConfig(**{\n",
    "    #    \"name\":'o1',\n",
    "    #    \"identifier\" : 'openai/o1',\n",
    "    #})\n",
    "    ]\n",
    "\n",
    "config = {\n",
    "    \"model_to_test\": models_to_test\n",
    "}\n",
    "\n",
    "\n",
    "\n",
    "def ask_question_from_llm(q: Question, model:ModelConfig) -> dict[str,Any]:\n",
    "    #setting up prompts configs\n",
    "    q.question_first = True\n",
    "    q.text_type = \"choice\"\n",
    "    q.question = question_templating(q, ds.asset_descriptions)\n",
    "\n",
    "    mcq = MultipleChoiceQuestion()\n",
    "    mcq.load_dict(q.to_dict())\n",
    "\n",
    "    prompt = mcq.get_prompt()\n",
    "    print(prompt)\n",
    "    client = LLMConfiguration(model)\n",
    "    response =  client.get_response(prompt)\n",
    "\n",
    "    a = {\n",
    "                \"id\": q.id,\n",
    "                \"prompt\": prompt,\n",
    "                \"question_text\": mcq.question,\n",
    "                \"options_text\": mcq.options,\n",
    "                \"true_answer\": mcq.correct,\n",
    "                \"model\": model.__dict__,\n",
    "                \"model_output\": response,\n",
    "                \"model_original_output\": response,\n",
    "            }\n",
    "    \n",
    "    return a\n",
    "    \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "id": "a11f8584",
   "metadata": {},
   "outputs": [],
   "source": [
    "from models_utils.utils.concurrency import concurrent_dict_execution\n",
    "from dataset.utils import file_handle\n",
    "\n",
    "def run_bench_for_llm(llm:ModelConfig, dataset:ADIQDataset) -> dict[int, dict[str,Any]]:\n",
    "    print(\"Run Experiment for {llm}\".format(llm=llm))\n",
    "\n",
    "    param_dict = {v.id:[v, llm] for v in dataset.questions[:1]}\n",
    "    model_data = MODEL_MAP.get(llm.name)\n",
    "    results = {k:v for k,v in concurrent_dict_execution(\n",
    "            ask_question_from_llm,\n",
    "            param_dict,\n",
    "            num_max_workers=model_data.get(\"num_workers\",4)\n",
    "        )}\n",
    "    return results\n",
    "\n",
    "def run_llm_suit(ds:ADIQDataset, save_loc_data:str, llm_list=config['model_to_test']):\n",
    "    os.makedirs(save_loc_data, exist_ok=True)\n",
    "    for l in llm_list:\n",
    "        if os.path.exists(os.path.join(SAVE_LOC, f'{l.name}.json')):\n",
    "            print(\"Experiment exist for {llm}\".format(llm=l.name))\n",
    "            continue\n",
    "\n",
    "        _temp = copy.deepcopy(l.__dict__)\n",
    "        _temp[\"results\"] = run_bench_for_llm(\n",
    "            l,\n",
    "            ds,\n",
    "        )\n",
    "\n",
    "        file_handle.save_json(\n",
    "            _temp,\n",
    "            os.path.join(save_loc_data, f'{l.name}.json')\n",
    "        )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "id": "c93b61a3",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Run Experiment for ModelConfig(name='mistral-large', identifier='mistralai/mistral-large')\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Completed::   0%|          | 0/1 [00:00<?, ?it/s]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Please select the correct option(s) from the following options given the question:\n",
      "Question: \n",
      "## Asset Description:\n",
      "AHU: Air Handling Unit: A device used to condition and circulate air as part of a heating, ventilating, and air-conditioning (HVAC) system.\n",
      "\n",
      "## Helpful words:\n",
      "Supply Relative Humidity %,Humidity,Supply Relative Humidity Setpoint %,Relative Humidity : The ratio of the amount of water vapor present in air to the amount needed for saturation at the same temperature.\n",
      "Override,override : To interrupt the action of an automatic device or system, typically to take manual control.\n",
      "Check the command from the BMS : Verify the specific command issued by the BMS.\n",
      "Reset temperature to outside conditions,Reset temperature : Adjusting the setpoint temperature based on outside conditions to optimize energy efficiency.\n",
      "Zone Temperature OR Return Temperature less than 65 F / 18.3 C : The temperature in a specific area or the temperature of the air returning to the AHU is below 65°F or 18.3°C\n",
      "\n",
      "\n",
      "## Conditions:\n",
      "- AHU Running\n",
      "- Outside Air Damper % < 15% AND Outside Air Damper Minimum % Not  Reporting\n",
      "- Economizer Mode AND Supply Relative Humidity % Not Reporting\n",
      "- OAT < Setpoint Temperature\n",
      "- Outside Air Damper %\n",
      "- OAT > 37 °F\n",
      "- Outside Air Damper % Does NOT = Daily Average\n",
      "- SubType NOT OAU, RAS, RAU\n",
      "\n",
      "## How long the conditions were met:\n",
      "Met for 2 Hours\n",
      "\n",
      "Looking at the current state of the asset, what is the MOST likely cause among the options?\n",
      "\n",
      "Options:\n",
      "(P) Control system sent the wrong command\n",
      "(Q) Belts are loose or broken\n",
      "(S) Broken Belt\n",
      "(R) Vanes at wrong angle\n",
      "Your output must strictly follow this format:\n",
      "{\"answer\": <the list of selected options, e.g., [\"(P)\", \"(Q)\", \"(S)\", \"(R)\"]>}\n",
      "\n",
      "Your output in a single line:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Completed:: 100%|██████████| 1/1 [00:04<00:00,  4.62s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Error in 1449: name 'response' is not defined\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    }
   ],
   "source": [
    "run_llm_suit(ds,\"test\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "884cf098",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
