{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "the delivery rate for llama318b, is: 0.8466666666666667\n",
      "llama318b have 46 error stops. In them, 22 are dead loop due to invalid argument function call, 23 are call the function in wrong order.\n",
      "rightAccommodationSearch: 272, rightRestaurantSearch: 276, rightAttractionSearch: 294\n"
     ]
    }
   ],
   "source": [
    "import json\n",
    "#delivery rate\n",
    "def getDeliveryRate(model, numPlan):\n",
    "    delivered = 0\n",
    "    with open (f'Output/{model}/plans/toolUsePlans.jsonl','r') as f:\n",
    "         plans = [json.loads(line.strip()) for line in f]\n",
    "\n",
    "    for record in plans:\n",
    "        if record['plan'] != \"\":\n",
    "            delivered += 1\n",
    "    return delivered / numPlan\n",
    "\n",
    "#need revision to be more precise\n",
    "def getInvalidLoopAndWrongOrderRate(model):\n",
    "    allError = 0\n",
    "    invalidArgDeadLoop = 0\n",
    "    wrongOrder = 0\n",
    "\n",
    "    stoppedList = []\n",
    "    with open (f'Output/{model}/plans/toolUseLogs.jsonl','r') as f:\n",
    "        logs = [json.loads(line.strip()) for line in f]\n",
    "    for log in logs:\n",
    "        for step in reversed(log['log']):\n",
    "            if step['state'] != 'Successful':\n",
    "                #print(log['index'], step['step'],step['state'], step['action'])\n",
    "                if step['state'] == 'same action 3 times repeated':\n",
    "                    allError += 1\n",
    "                    stoppedList.append([log['index'],step['step']])\n",
    "\n",
    "    for stop in stoppedList:\n",
    "        plan = stop[0] - 1\n",
    "        index = stop[1] - 2\n",
    "\n",
    "        if logs[plan]['log'][index]['state'] == 'Illegal args. Parameter Error':\n",
    "            invalidArgDeadLoop += 1\n",
    "        elif logs[plan]['log'][index]['state'] == 'Illegal args. Other Error':\n",
    "            wrongOrder += 1\n",
    "        else:\n",
    "            continue\n",
    "\n",
    "\n",
    "    #print(stoppedList)\n",
    "    return allError, invalidArgDeadLoop, wrongOrder\n",
    "\n",
    "def getRightFunctionCall(model):\n",
    "    rightRestaurantSearch = 0\n",
    "    rightAccommodationSearch = 0\n",
    "    rightAttractionSearch = 0\n",
    "    with open (f'Output/{model}/plans/toolUseLogs.jsonl','r') as f:\n",
    "        logs = [json.loads(line.strip()) for line in f]\n",
    "    for log in logs:\n",
    "        for step in reversed(log['log']):\n",
    "            if step['state'] == 'Successful':\n",
    "                if 'Accommodation' in step['action']:\n",
    "                     rightAccommodationSearch += 1\n",
    "                     break\n",
    "        \n",
    "        for step in reversed(log['log']):\n",
    "            if step['state'] == 'Successful':\n",
    "                if 'Restaurant' in step['action']:\n",
    "                     rightRestaurantSearch += 1\n",
    "                     break\n",
    "        \n",
    "        for step in reversed(log['log']):\n",
    "            if step['state'] == 'Successful':\n",
    "                if 'Attraction' in step['action']:\n",
    "                     rightAttractionSearch += 1\n",
    "                     break\n",
    "    \n",
    "    return rightAccommodationSearch, rightRestaurantSearch, rightAttractionSearch\n",
    "\n",
    "if __name__ == \"__main__\":\n",
    "    model = 'llama318b'\n",
    "    deliverayRate = getDeliveryRate('llama318b',300)\n",
    "    print(f\"the delivery rate for {model}, is:\" ,deliverayRate)\n",
    "\n",
    "    allError,invalidArgDeadLoop,wrongOrder = getInvalidLoopAndWrongOrderRate(model)\n",
    "    print(f\"{model} have {allError} error stops. In them, {invalidArgDeadLoop} are dead loop due to invalid argument function call, {wrongOrder} are call the function in wrong order.\")\n",
    "\n",
    "    acco, res, right = getRightFunctionCall(model)\n",
    "    print(f\"rightAccommodationSearch: {acco}, rightRestaurantSearch: {res}, rightAttractionSearch: {right}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "torchgpu",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.0"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
