{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "==Model:  gpt4o ==\n",
      "==Task:  filteredDataRouteOP ==\n",
      "[0.32, 0.0, 0.0, 0.017142857142857144, 0.0, 0.49714285714285716, 0.1657142857142857, 0.0]\n"
     ]
    }
   ],
   "source": [
    "#Analysis the error parameter rate of GPT-4o\n",
    "import json\n",
    "from fuzzywuzzy import fuzz\n",
    "import numpy as np\n",
    "import sys\n",
    "import os\n",
    "import json\n",
    "import re\n",
    "\n",
    "def getID(name,address,category):\n",
    "    #as long as there is a '-', then return -2\n",
    "    #if there is an empty list, then return []\n",
    "    #if the information doesn't match, return -1\n",
    "\n",
    "    if name == \"-\" and address == \"-\":\n",
    "        return -2\n",
    "\n",
    "    #normal case\n",
    "    idFromName = []\n",
    "    idFromAddress = []\n",
    "\n",
    "    address = address.split(\",\")[0]\n",
    "    \n",
    "    #restaurants\n",
    "    if category == 'restaurants':\n",
    "        for restaurant in restaurants:\n",
    "            if restaurant['name'].lower() == name.lower():\n",
    "                idFromName.append(restaurant['business_id'])\n",
    "            if restaurant['address'].lower() == address.lower():\n",
    "                idFromAddress.append(restaurant['business_id'])\n",
    "        set1 = set(idFromName)\n",
    "        set2 = set(idFromAddress)\n",
    "        #if the extracted id from name and address make an agreement\n",
    "        if(len(set1 & set2) == 1):\n",
    "            return list(set1 & set2)[0]\n",
    "        # if not, we have to use similarity score to determine the id\n",
    "        else:\n",
    "            name_sim_score = []\n",
    "            address_sim_score = []\n",
    "\n",
    "            for restaurant in restaurants:\n",
    "                name_sim_score.append(fuzz.ratio(name.lower(), restaurant['name'].lower()))\n",
    "                address_sim_score.append(fuzz.ratio(address.lower(), restaurant['address'].lower()))\n",
    "\n",
    "            scores = np.array(name_sim_score) + np.array(address_sim_score)\n",
    "            #if the score is high enough, then we claim the id\n",
    "            if max(scores) >= 120:\n",
    "                return restaurants[np.argmax(scores)]['business_id']\n",
    "            #if the score is less than 60 for each, then we indicate that the business is out of the pool\n",
    "            else:\n",
    "                return -1\n",
    "    #attractions \n",
    "    if category == 'attractions':\n",
    "        for attraction in attractions:\n",
    "            if attraction['name'].lower() == name.lower():\n",
    "                idFromName.append(attraction['business_id'])\n",
    "            if attraction['address'].lower() == address.lower():\n",
    "                idFromAddress.append(attraction['business_id'])\n",
    "        \n",
    "        set1 = set(idFromName)\n",
    "        set2 = set(idFromAddress)\n",
    "\n",
    "        if(len(set1 & set2) == 1):\n",
    "            return list(set1 & set2)[0]\n",
    "        else:\n",
    "            name_sim_score = []\n",
    "            address_sim_score = []\n",
    "\n",
    "            for attraction in attractions:\n",
    "                name_sim_score.append(fuzz.ratio(name.lower(), attraction['name'].lower()))\n",
    "                address_sim_score.append(fuzz.ratio(address.lower(), attraction['address'].lower()))\n",
    "\n",
    "            if max(name_sim_score) == 100:\n",
    "                return attractions[np.argmax(name_sim_score)]['business_id']\n",
    "\n",
    "            scores = np.array(name_sim_score) + np.array(address_sim_score)\n",
    "            if max(scores) >= 120:\n",
    "                return attractions[np.argmax(scores)]['business_id']\n",
    "            else:\n",
    "                return -1\n",
    "    #hotels\n",
    "    if category == 'hotels':\n",
    "        for hotel in hotels:\n",
    "            if hotel['name'].lower() == name.lower():\n",
    "                idFromName.append(hotel['business_id'])\n",
    "            if hotel['address'].lower() == address.lower():\n",
    "                idFromAddress.append(hotel['business_id'])\n",
    "        set1 = set(idFromName)\n",
    "        set2 = set(idFromAddress)\n",
    "        if(len(set1 & set2) == 1):\n",
    "            return list(set1 & set2)[0]\n",
    "        else:\n",
    "            name_sim_score = []\n",
    "            address_sim_score = []\n",
    "\n",
    "            for hotel in hotels:\n",
    "                name_sim_score.append(fuzz.ratio(name.lower(), hotel['name'].lower()))\n",
    "                address_sim_score.append(fuzz.ratio(address.lower(), hotel['address'].lower()))\n",
    "\n",
    "            scores = np.array(name_sim_score) + np.array(address_sim_score)\n",
    "            if max(scores) >= 120:\n",
    "                return hotels[np.argmax(scores)]['business_id']\n",
    "            else:\n",
    "                return -1\n",
    "\n",
    "def prepareEval(plan):\n",
    "    plan_eval = []\n",
    "    for days in plan['itinerary']:\n",
    "        day = {}\n",
    "        day['days'] = days['days']\n",
    "        #print(days['breakfast']['name'])\n",
    "        day['breakfast'] = getID(days['breakfast']['name'],days['breakfast']['address'],'restaurants')\n",
    "        day['morning_attractions'] = [getID(attraction['name'],attraction['address'],'attractions') for attraction in days['morning_attractions']]\n",
    "        day['lunch'] = getID(days['lunch']['name'],days['lunch']['address'],'restaurants')\n",
    "        day['afternoon_attractions'] = [getID(attraction['name'],attraction['address'],'attractions') for attraction in days['afternoon_attractions']]\n",
    "        day['dinner'] = getID(days['dinner']['name'],days['dinner']['address'],'restaurants')\n",
    "        day['night_attractions'] = [getID(attraction['name'],attraction['address'],'attractions') for attraction in days['night_attractions']]\n",
    "        day['accommodation'] = getID(days['accommodation']['name'],days['accommodation']['address'],'hotels')\n",
    "        plan_eval.append(day)\n",
    "    #print(plan_eval)\n",
    "    return plan_eval\n",
    "\n",
    "def evaluate_outSidePool(plan_eval):\n",
    "    for day in plan_eval:\n",
    "        for key,value in day.items():\n",
    "            if isinstance(value, list):\n",
    "                for id in value:\n",
    "                    if id == -1:\n",
    "                        return 1\n",
    "            else:\n",
    "                if value == -1:\n",
    "                    return 1\n",
    "    return 0\n",
    "\n",
    "def evaluate_missingInfo(plan_eval):\n",
    "    for day in plan_eval:\n",
    "        for key,value in day.items():\n",
    "            #night attraction can be skipped\n",
    "            if key == 'night_attractions':\n",
    "                continue\n",
    "\n",
    "            if isinstance(value, list):\n",
    "\n",
    "                if(len(value) == 0):\n",
    "                        return 1\n",
    "                else:\n",
    "                    for val in value:\n",
    "                        if val == -2:\n",
    "                            return 1\n",
    "            else:\n",
    "                if value == -2:\n",
    "                    return 1\n",
    "\n",
    "    return 0\n",
    "\n",
    "def evaluate_day(plan_eval,eval):\n",
    "    day_numerator = 0\n",
    "    day_denominator = 1\n",
    "\n",
    "    if(len(plan_eval) == int(eval['day'][0][0])):\n",
    "        day_numerator = 1\n",
    "    return day_numerator, day_denominator\n",
    "\n",
    "def evaluate_price(plan_eval,eval):\n",
    "    price_numerator = 0\n",
    "    price_denominator = 0\n",
    "\n",
    "    price_map = {'cheap budget':['$','$$'],'moderate budget':['$','$$','$$$'],'expensive budget':['$$','$$$','$$$$']}\n",
    "    price_limit = price_map[eval['price'][0]]\n",
    "\n",
    "    #price - meals\n",
    "    all_meals = []\n",
    "    for day in plan_eval:\n",
    "        all_meals.append(day['breakfast'])\n",
    "        all_meals.append(day['lunch'])\n",
    "        all_meals.append(day['dinner'])\n",
    "    price_denominator += len(all_meals)\n",
    "\n",
    "    for restaurant_id in all_meals:\n",
    "        if restaurant_id != -1 and restaurant_id != -2:\n",
    "            for restaurant in restaurants:\n",
    "                if(restaurant['business_id'] == restaurant_id):\n",
    "                    if(restaurant['price'] in price_limit):\n",
    "                        price_numerator += 1\n",
    "\n",
    "\n",
    "    #price hotel\n",
    "    for day in plan_eval:\n",
    "        hotel_id = day['accommodation']\n",
    "        if hotel_id != -1 and hotel_id != -2:\n",
    "            price_denominator += 1\n",
    "            for hotel in hotels:\n",
    "                if(hotel['business_id'] == hotel_id):\n",
    "                    if(hotel['price'] in price_limit):\n",
    "                        price_numerator += 1\n",
    "    \n",
    "\n",
    "\n",
    "    #price - attractions\n",
    "    all_attractions = []\n",
    "    for day in plan_eval:\n",
    "        for id in day['morning_attractions']:\n",
    "            all_attractions.append(id)\n",
    "        for id in day['afternoon_attractions']:\n",
    "            all_attractions.append(id)\n",
    "        for id in day['night_attractions']:\n",
    "            all_attractions.append(id)\n",
    "    price_denominator += len(all_attractions)\n",
    "\n",
    "    for attraction_id in all_attractions:\n",
    "        if attraction_id != -1 and attraction_id != -2:\n",
    "            for attraction in attractions:\n",
    "                if(attraction['business_id'] == attraction_id):\n",
    "                    if(attraction['price'] in price_limit):\n",
    "                        price_numerator += 1\n",
    "\n",
    "\n",
    "    return price_numerator, price_denominator\n",
    "\n",
    "def evaluate_attraction_orientation(plan_eval,eval):\n",
    "    #attraction orientation\n",
    "    orientation_numerator = 0\n",
    "    orientation_denominator = 0\n",
    "\n",
    "    oritentation_limit = eval['attraction'][0]\n",
    "    oritentation_category = oritentation_limit\n",
    "    oritentation_acceptable_list = ['medium ' + oritentation_limit, 'high ' + oritentation_limit]\n",
    "    #print(oritentation_acceptable_list)\n",
    "    all_attractions = []\n",
    "    for day in plan_eval:\n",
    "        for id in day['morning_attractions']:\n",
    "            all_attractions.append(id)\n",
    "        for id in day['afternoon_attractions']:\n",
    "            all_attractions.append(id)\n",
    "        for id in day['night_attractions']:\n",
    "            all_attractions.append(id)\n",
    "    orientation_denominator += len(all_attractions)\n",
    "    for attraction_id in all_attractions:\n",
    "        if attraction_id != -1 and attraction_id != -2:\n",
    "            for attraction in attractions:\n",
    "                if(attraction['business_id'] == attraction_id):\n",
    "                    if attraction[oritentation_category] in oritentation_acceptable_list:\n",
    "                        #print(\"attraction orientation is acceptable which is: \", attraction[oritentation_category])\n",
    "                        orientation_numerator += 1\n",
    "                        \n",
    "    return orientation_numerator,orientation_denominator\n",
    "                    #else:\n",
    "                        #print(\"attraction orientation is not acceptable which is: \", attraction[oritentation_category])\n",
    "\n",
    "def evaluate_cuisine(plan_eval,eval):\n",
    "    #cuisine\n",
    "    cuisine_numerator = 0\n",
    "    cuisine_denominator = 0\n",
    "    cuisine_satisfied = False\n",
    "\n",
    "    cuisine_limit = [eval['cuisine'][0]]\n",
    "    #print(cuisine_limit)\n",
    "    if cuisine_limit == ['US']:\n",
    "        cuisine_limit = ['American','American (New)','American (Traditional)']\n",
    "\n",
    "    #at least we have one restaurant that match the cuisin, we will turn it to true\n",
    "    all_meals = []\n",
    "    for day in plan_eval:\n",
    "        all_meals.append(day['breakfast'])\n",
    "        all_meals.append(day['lunch'])\n",
    "        all_meals.append(day['dinner'])\n",
    "    cuisine_denominator += len(all_meals)\n",
    "    #print(cuisine_denominator)\n",
    "\n",
    "    for restaurant_id in all_meals:\n",
    "        if restaurant_id != -1 and restaurant_id != -2:\n",
    "            for restaurant in restaurants:\n",
    "                if(restaurant['business_id'] == restaurant_id):\n",
    "                    cuisine_provided = []\n",
    "                    cuisine_provided.append(restaurant['cuisine_1'])\n",
    "                    cuisine_provided.append(restaurant['cuisine_2'])\n",
    "                    #print(restaurant_id)\n",
    "                    #print((set(cuisine_provided))) \n",
    "                    if(len(list(set(cuisine_limit) & set(cuisine_provided))) > 0):\n",
    "                        cuisine_numerator += 1\n",
    "    #print(list(set(cuisine_limit)))\n",
    "    \n",
    "    return cuisine_numerator, cuisine_denominator\n",
    "\n",
    "def evaluate_restaurants(plan_eval,eval):\n",
    "    #restaurant \n",
    "    restaurants_numerator = 0\n",
    "    restaurants_denominator = 0\n",
    "\n",
    "    restaurants_limits = eval['restaurant']\n",
    "    restaurants_category = [cat[5:] for cat in restaurants_limits]\n",
    "\n",
    "\n",
    "\n",
    "    all_meals = []\n",
    "    for day in plan_eval:\n",
    "        all_meals.append(day['breakfast'])\n",
    "        all_meals.append(day['lunch'])\n",
    "        all_meals.append(day['dinner'])\n",
    "    restaurants_denominator += len(all_meals)\n",
    "    restaurants_denominator = restaurants_denominator * len(restaurants_category)\n",
    "\n",
    "    for cat in restaurants_category:\n",
    "        find_not_satisfication = False\n",
    "        restaurants_acceptable_list = []\n",
    "        restaurants_acceptable_list.append('good ' + cat)\n",
    "        restaurants_acceptable_list.append('excellent ' + cat)\n",
    "\n",
    "        for restaurant_id in all_meals: \n",
    "            if restaurant_id != -1 and restaurant_id != -2:\n",
    "                for restaurant in restaurants:\n",
    "                    if(restaurant['business_id'] == restaurant_id):\n",
    "                        if(restaurant[cat] in restaurants_acceptable_list):\n",
    "                            restaurants_numerator += 1\n",
    "    return restaurants_numerator, restaurants_denominator\n",
    "\n",
    "def evaluate_hotels(plan_eval,eval):\n",
    "    #Hotel\n",
    "\n",
    "    hotel_numerator = 0\n",
    "    hotel_denominator = 0\n",
    "    \n",
    "\n",
    "    hotel_limit = eval['hotel']\n",
    "    hotel_cat = [cat[5:] for cat in hotel_limit]\n",
    "\n",
    "    all_hotels = []\n",
    "    for day in plan_eval:\n",
    "        hotel_id = day['accommodation']\n",
    "        all_hotels.append(hotel_id)\n",
    "    hotel_denominator += len(all_hotels)\n",
    "    hotel_denominator *= len(hotel_cat)\n",
    "\n",
    "    for cat in hotel_cat:\n",
    "        find_not_satisfied = False\n",
    "        hotel_acceptable_list = []\n",
    "        hotel_acceptable_list.append('good ' + cat)\n",
    "        hotel_acceptable_list.append('excellent ' + cat)\n",
    "\n",
    "        for hotel_id in all_hotels:\n",
    "            if hotel_id != -1 and hotel_id != -2:\n",
    "                for hotel in hotels:\n",
    "                    if(hotel['business_id'] == hotel_id):    \n",
    "                        if(hotel[cat] in hotel_acceptable_list):\n",
    "                            hotel_numerator += 1\n",
    "    \n",
    "\n",
    "\n",
    "    #note: only for hotel, we need to consider what if no recommendation, which means\n",
    "    # all -2, we don't consider this in other categories since there is low chance that\n",
    "    #llm didn't provide any reccommendation for food or attractions. \n",
    "    if(all(x == -2 for x in all_hotels)):\n",
    "        hotel_numerator= 0 \n",
    "        hotel_denominator = 0\n",
    "\n",
    "    return hotel_numerator, hotel_denominator\n",
    "\n",
    "def getFailure(failure_list):\n",
    "    failure = [sum(x) for x in zip(*failure_list)]\n",
    "    failure = [(x/len(failure_list)) for x in failure]\n",
    "    return failure\n",
    "\n",
    "def getMicro(preference_list):    \n",
    "    micro = np.array([0,0])\n",
    "    for record in preference_list:\n",
    "        for cat in record:\n",
    "            micro += np.array(cat)\n",
    "    #print(micro)\n",
    "    return micro[0]/micro[1]\n",
    "\n",
    "def getMacro(preference_list):    \n",
    "    numerator = []\n",
    "    denomminator = len(preference_list)\n",
    "    for record in preference_list:\n",
    "        each =  [sum(x) for x in zip(*record)]\n",
    "        numerator.append(1 if each[0] == each[1] else 0)\n",
    "    #print(numerator, denomminator)\n",
    "    return sum(numerator)/denomminator\n",
    "\n",
    "def getNewMacro(preference_list, passrate):\n",
    "    numerator = 0\n",
    "    denominator = len(preference_list)\n",
    "\n",
    "    for plan in preference_list:\n",
    "        passedPlan = True\n",
    "        for day in plan:\n",
    "            if day[0] == day[1] == 0:\n",
    "                continue\n",
    "            if (day[0] / day[1]) < passrate:\n",
    "                passedPlan = False\n",
    "                break\n",
    "        if passedPlan:\n",
    "            numerator += 1\n",
    "    #print(numerator, denominator)\n",
    "    return numerator/denominator\n",
    "\n",
    "def getFailureAndPreferenceList(model,task,planIndex):\n",
    "    failure_list = []\n",
    "    preference_list = []\n",
    "    \n",
    "    with open(f'Output/{model}/evals/{task}.jsonl', 'r') as f:\n",
    "        plans = [json.loads(line) for line in f]\n",
    "\n",
    "    with open(f'Prompts/evals.jsonl', 'r') as f:\n",
    "            evals = [json.loads(line) for line in f]\n",
    "\n",
    "    plan = plans[planIndex]['plan']\n",
    "    eval = evals[planIndex]['eval_info']\n",
    "    \n",
    "    # Failure rate related\n",
    "    # prepare a result list to return\n",
    "    # outofpool, missinginfo,\n",
    "    results = []\n",
    "    # prepare the evaluation for each plan, search the business id\n",
    "    plan_eval = prepareEval(plan)\n",
    "    #print(plan_eval)\n",
    "\n",
    "    outsidepool = evaluate_outSidePool(plan_eval)\n",
    "    results.append(outsidepool)\n",
    "\n",
    "\n",
    "    missingInfo = evaluate_missingInfo(plan_eval)\n",
    "    results.append(missingInfo)\n",
    "    #print(results)\n",
    "\n",
    "    failure_list.append(results)\n",
    "\n",
    "    # preference recall related\n",
    "    \n",
    "    results = []\n",
    "\n",
    "    #day\n",
    "    day_numerator, day_denominator = evaluate_day(plan_eval,eval)\n",
    "    results.append([day_numerator, day_denominator])\n",
    "\n",
    "    #price\n",
    "    price_numerator, price_denominator = evaluate_price(plan_eval,eval)\n",
    "    results.append([price_numerator, price_denominator])\n",
    "\n",
    "    #attraction orientation\n",
    "    attraction_numerator, attraction_denominator = evaluate_attraction_orientation(plan_eval,eval)\n",
    "    results.append([attraction_numerator, attraction_denominator])\n",
    "    \n",
    "    #cuisine\n",
    "    cuisine_numerator, cuisine_denominator = evaluate_cuisine(plan_eval,eval)\n",
    "    results.append([cuisine_numerator, cuisine_denominator])\n",
    "\n",
    "    #restaurants\n",
    "    restaurants_numerator, restaurants_denominator = evaluate_restaurants(plan_eval,eval)\n",
    "    results.append([restaurants_numerator, restaurants_denominator])\n",
    "\n",
    "    #hotels\n",
    "    hotels_numerator, hotels_denominator = evaluate_hotels(plan_eval,eval)\n",
    "    results.append([hotels_numerator, hotels_denominator])\n",
    "\n",
    "    preference_list.append(results)\n",
    "    #print(preference_list)\n",
    "    return failure_list, preference_list\n",
    "\n",
    "def populateCordinates(plan_eval, data, data_hotel):\n",
    "    cordinates = []\n",
    "    for day in plan_eval:\n",
    "        cordinate_one_day = []\n",
    "\n",
    "        #if the hotel is invalid, we skip the day\n",
    "        if(day['accommodation'] == -1 or day['accommodation'] == -2):\n",
    "            continue\n",
    "\n",
    "        if(day['accommodation'] != -1):\n",
    "            cordinate_one_day.append(getCordinate_Hotel(day['accommodation'], data_hotel))\n",
    "        \n",
    "        for attraction in day['morning_attractions']:\n",
    "            if(attraction != -1):\n",
    "                cordinate_one_day.append(getCordinate(attraction,data))\n",
    "        for attraction in day['afternoon_attractions']:\n",
    "            if(attraction != -1):\n",
    "                cordinate_one_day.append(getCordinate(attraction,data))\n",
    "        for attraction in day['night_attractions']:\n",
    "            if(attraction != -1):\n",
    "                cordinate_one_day.append(getCordinate(attraction,data))\n",
    "                \n",
    "        cordinates.append(cordinate_one_day)\n",
    "    return cordinates\n",
    "\n",
    "def getCordinate(id,data):\n",
    "    for attraction in data:\n",
    "        if attraction['business_id'] == id:\n",
    "            return (attraction['latitude'], attraction['longitude'])\n",
    "\n",
    "def getCordinate_Hotel(id,data_hotel):\n",
    "    for hotel in data_hotel:\n",
    "        if hotel['business_id'] == id:\n",
    "            return (hotel['latitude'], hotel['longitude'])\n",
    "        \n",
    "def getDistanceMatrix(cordinates):\n",
    "    #print(cordinates)\n",
    "    n = len(cordinates)\n",
    "    distance_matrix = np.zeros((n, n))\n",
    "    for i in range(n):\n",
    "        for j in range(i+1, n):\n",
    "            distance_matrix[i][j] = distance_matrix[j][i] = ((cordinates[i][0]*1000 - cordinates[j][0]*1000)**2 + (cordinates[i][1]*1000 - cordinates[j][1]*1000)**2)**0.5\n",
    "    return distance_matrix\n",
    "\n",
    "def populateShortestDistanceOneDay(cordinates):\n",
    "    shortest_distance_list = []\n",
    "    shortest_distance_info_lists = []\n",
    "    for oneday in cordinates:\n",
    "        distance_matrix = getDistanceMatrix(oneday)\n",
    "        n = len(distance_matrix)\n",
    "        info_lists = []\n",
    "        optimized_distance = totalCost(1, 0, n, distance_matrix,info_lists)\n",
    "        shortest_distance_list.append(optimized_distance)\n",
    "        shortest_distance_info_lists.append(info_lists)\n",
    "    return shortest_distance_list, shortest_distance_info_lists\n",
    "\n",
    "def totalCost(mask, pos, n, cost, info_lists):\n",
    "    distance_list = []\n",
    "    i_list = []\n",
    "    # Base case: if all cities are visited, return the\n",
    "    # cost to return to the starting city (0)\n",
    "    if mask == (1 << n) - 1:\n",
    "        return cost[pos][0]\n",
    "\n",
    "    ans = sys.maxsize   \n",
    "\n",
    "    # Try visiting every city that has not been visited yet\n",
    "    for i in range(n):\n",
    "        if (mask & (1 << i)) == 0: \n",
    "            i_list.append(i)\n",
    "            # If city i is not visited, visit it and \n",
    "            #  update the mask\n",
    "            distance_list.append(cost[pos][i] +\n",
    "                      totalCost(mask | (1 << i), i, n, cost, info_lists))\n",
    "        \n",
    "\n",
    "    info_list = [pos,i_list, distance_list]\n",
    "    info_lists.append(info_list)\n",
    "    \n",
    "    ans = min(distance_list)\n",
    "    return ans\n",
    "\n",
    "def populatePlannedDistanceOneDay(cordinates):\n",
    "    planned_distance_list = []\n",
    "    for oneday in cordinates:\n",
    "        distance_matrix = getDistanceMatrix(oneday)\n",
    "        #print(distance_matrix)\n",
    "        distance = 0\n",
    "        for i in range(len(distance_matrix)):\n",
    "            if i == len(distance_matrix) - 1:\n",
    "                j = 0\n",
    "            else:\n",
    "                j = i + 1\n",
    "            distance += distance_matrix[i][j]\n",
    "        planned_distance_list.append(distance)\n",
    "    return planned_distance_list\n",
    "\n",
    "def getDistanceGapRatio(shortest_distances_by_day, planned_distances_by_day):\n",
    "    distance_gap = 0\n",
    "    total_distance = 0\n",
    "    for optimized_distance, planned_distance in zip(shortest_distances_by_day, planned_distances_by_day):\n",
    "        gap = []\n",
    "        gap = np.sum(np.array(planned_distance) - np.array(optimized_distance))\n",
    "        distance_gap += gap\n",
    "        \n",
    "        total = np.sum(np.array(planned_distance))\n",
    "        total_distance += total\n",
    "        \n",
    "    return distance_gap / total_distance\n",
    "\n",
    "def getOptimizedOrder(shortest_distance_info_lists):\n",
    "\n",
    "\n",
    "    order_list = []\n",
    "    for day in shortest_distance_info_lists:\n",
    "\n",
    "        if len(day) == 0:\n",
    "            order_list.append([[0],[0]])\n",
    "            continue\n",
    "\n",
    "        pos = 0\n",
    "        n = len(day[-1][1]) + 1\n",
    "        #get a list of 1 to n\n",
    "        candidates = list(range(n-1))\n",
    "        #add 1 to the values\n",
    "        candidates = [x+1 for x in candidates]\n",
    "\n",
    "        moves = []\n",
    "\n",
    "        while len(candidates) > 0:\n",
    "            #find the last one in the lnfo_list\n",
    "            for i in range(len(day)):\n",
    "                if day[i][0] == pos and day[i][1] == candidates:\n",
    "                    #print(day[i][0],day[i][1])\n",
    "                    next_move = day[i][1][np.argmin(day[i][2])]\n",
    "                    #print(next_move)\n",
    "                    pos = next_move\n",
    "                    moves.append(next_move)\n",
    "                    #take next move out of candidates\n",
    "                    candidates.remove(next_move)\n",
    "\n",
    "        moves_reversed = moves[::-1]\n",
    "        optimized_route = [[0] + moves, [0] + moves_reversed]\n",
    "        order_list.append(optimized_route)\n",
    "\n",
    "    return order_list\n",
    "        \n",
    "def getPositionDeviationRatio(shortest_order_by_day):\n",
    "    total_places = 0\n",
    "    total_deviation = 0\n",
    "    for plan in shortest_order_by_day:\n",
    "        for day in plan:\n",
    "            n = len(day[0])\n",
    "            total_places += n\n",
    "            output_route = list(range(n))\n",
    "            gap_1 = sum([1 if x != y else 0 for x,y in zip(output_route,day[0])])\n",
    "            gap_2 = sum([1 if x != y else 0 for x,y in zip(output_route,day[1])])\n",
    "            total_deviation += min(gap_1, gap_2)\n",
    "    return total_deviation / total_places\n",
    "\n",
    "def daywiseTSP(model,task, numPlan):\n",
    "    shortest_distances_by_day = []\n",
    "    planned_distances_by_day = []\n",
    "    shortest_order_by_day = []\n",
    "\n",
    "    with open(f'Output/{model}/evals/{task}.jsonl', 'r') as f:\n",
    "        plans = [json.loads(line) for line in f]\n",
    "    for i in range(numPlan):\n",
    "        if (i%20 == 0):\n",
    "            print(\"Mode: day wise. We are at plan \", i)\n",
    "        plan = plans[i]['plan'] \n",
    "        \n",
    "        # Failure rate related\n",
    "        # prepare a result list to return\n",
    "        # outofpool, missinginfo,\n",
    "        # prepare the evaluation for each plan, search the business id\n",
    "        plan_eval = prepareEval(plan)\n",
    "        #print(plan_eval)\n",
    "\n",
    "        #get the cordinates\n",
    "        cordinates = populateCordinates(plan_eval, attractions, hotels)\n",
    "        #print(cordinates)\n",
    "        #one day shortest distance\n",
    "        shortest_distance_list_each_day, shortest_distance_info_lists = populateShortestDistanceOneDay(cordinates)\n",
    "        #print(shortest_distance_info_lists)\n",
    "        shortest_distances_by_day.append(shortest_distance_list_each_day)\n",
    "        \n",
    "        shortest_order_list_each_day = getOptimizedOrder(shortest_distance_info_lists)\n",
    "        \n",
    "        shortest_order_by_day.append(shortest_order_list_each_day)\n",
    "        #shortest_order_by_day(info_list)\n",
    "        \n",
    "        #one day planned distance\n",
    "        planned_distance_list_each_day = populatePlannedDistanceOneDay(cordinates)\n",
    "        planned_distances_by_day.append(planned_distance_list_each_day)\n",
    "\n",
    "        #plan wise (multi day) optimization calculation\n",
    "\n",
    "    #get distance gap ratio\n",
    "    distance_gap_ratio = getDistanceGapRatio(shortest_distances_by_day, planned_distances_by_day)\n",
    "\n",
    "    #position deviation ratio\n",
    "    position_deviation_ratio = getPositionDeviationRatio(shortest_order_by_day)\n",
    "    \n",
    "    return distance_gap_ratio, position_deviation_ratio\n",
    "\n",
    "def getHotelIndex(day,cordinates):\n",
    "    hotel_index = 0\n",
    "    if day > 0:\n",
    "        for j in range(day):\n",
    "            hotel_index += len(cordinates[j])\n",
    "    return hotel_index\n",
    "\n",
    "def totalCost_multiday(mask, pos, day, cordinates, n, visited, cost, info_lists, memo):\n",
    "    visit_requirement = len(cordinates[day])\n",
    "    distance_list = []\n",
    "    i_list = []\n",
    "\n",
    "    hotel_index = getHotelIndex(day,cordinates)\n",
    "    # Base case: if all cities are visited, return the\n",
    "    # cost to return to the starting city (0)\n",
    "\n",
    "    if mask == (1 << n) - 1:\n",
    "        return cost[pos][hotel_index]\n",
    "    \n",
    "    if memo[pos][mask] != -1:\n",
    "        return memo[pos][mask]\n",
    "\n",
    "    if visit_requirement == visited:\n",
    "        for i in range(n):\n",
    "            if (mask & (1 << i)) == 0: \n",
    "                i_list.append(i)\n",
    "                distance_list.append(cost[hotel_index][i] + totalCost_multiday(mask | (1 << i), i, day + 1, cordinates, n, 2, cost, info_lists,memo))\n",
    "        \n",
    "        info_list = [pos,i_list, distance_list]\n",
    "        info_lists.append(info_list)\n",
    "        \n",
    "        return min(distance_list) + cost[pos][hotel_index] # change this to the old hotel position\n",
    "    \n",
    "    # Try visiting every city that has not been visited yet\n",
    "    for i in range(n):\n",
    "        if (mask & (1 << i)) == 0: \n",
    "\n",
    "            i_list.append(i)\n",
    "            # If city i is not visited, visit it and \n",
    "             #  update the mask\n",
    "            distance_list.append(cost[pos][i] +\n",
    "                      totalCost_multiday(mask | (1 << i), i, day, cordinates, n, visited + 1, cost, info_lists,memo))\n",
    "        \n",
    "\n",
    "    info_list = [pos,i_list, distance_list]\n",
    "    info_lists.append(info_list)\n",
    "    \n",
    "    memo[pos][mask] = min(distance_list)\n",
    "\n",
    "    return min(distance_list)\n",
    "\n",
    "def getDistanceMatrix_by_plan(cordinates):\n",
    "    #print(cordinates)\n",
    "    n = 0\n",
    "    for day in cordinates:\n",
    "        for place in day:\n",
    "            n+=1\n",
    "    flattened = []\n",
    "    for day in cordinates:\n",
    "        for location in day:\n",
    "            flattened.append(location)\n",
    "    distance_matrix = np.zeros((n, n))\n",
    "    for i in range(n):\n",
    "        for j in range(i+1, n):\n",
    "            distance_matrix[i][j] = distance_matrix[j][i] = ((flattened[i][0]*1000 - flattened[j][0]*1000)**2 + (flattened[i][1]*1000 - flattened[j][1]*1000)**2)**0.5\n",
    "    return distance_matrix\n",
    "\n",
    "def getOptimizedDistance_by_plan(cordinates,distance_matrix):\n",
    "    n = len(distance_matrix)\n",
    "    info_lists = []\n",
    "    #newMask will have all the hotels as 1 before the function.\n",
    "    newMask = 1\n",
    "    index_list = list(range(len(cordinates) - 1))\n",
    "    index_list = index_list[::-1]\n",
    "    newMask = 1\n",
    "    for i in index_list:\n",
    "        newMask = (newMask << (len(cordinates[i]))) + 1\n",
    "    memo = [[-1] * (1 << n) for _ in range(n)]\n",
    "    optimized_distance = totalCost_multiday(newMask,0,0,cordinates,n,1,distance_matrix, info_lists,memo)\n",
    "    return optimized_distance, info_lists\n",
    "\n",
    "def getOptimizedOrder_by_plan(info_lists):\n",
    "    pos = 0\n",
    "    lookfor = info_lists[-1][1].copy()\n",
    "    moves = []\n",
    "    while len(lookfor) > 0:\n",
    "        for record in info_lists:\n",
    "            if(record[0] == pos and record[1] == lookfor):\n",
    "                nextmove = record[1][np.argmin(record[2])]\n",
    "                pos = nextmove\n",
    "                moves.append(nextmove)\n",
    "                lookfor.remove(pos)\n",
    "    return moves\n",
    "\n",
    "def getPlannedDistance_by_plan(cordinates, distance_matrix):\n",
    "    distance = 0\n",
    "    for i in range(len(distance_matrix)):\n",
    "        if i == len(distance_matrix) - 1:\n",
    "            j = len(distance_matrix) - len(cordinates[-1])\n",
    "        else:\n",
    "            j = i + 1\n",
    "        distance += distance_matrix[i][j]\n",
    "    return distance\n",
    "\n",
    "def getDistanceGapRatio_by_plan(optimized_distances_by_plan, planned_distances_by_plan):\n",
    "    gaps = np.array([])\n",
    "    for optimized,planned in zip(optimized_distances_by_plan,planned_distances_by_plan):\n",
    "        gap = planned - optimized\n",
    "        gaps = np.append(gaps,gap)\n",
    "    total_gap = np.sum(gaps)\n",
    "    total_planned = np.sum(planned_distances_by_plan)\n",
    "    ratio = total_gap / total_planned\n",
    "    return ratio\n",
    "\n",
    "def getDistanceGapRatio_by_plan(optimized_distances_by_plan, planned_distances_by_plan):\n",
    "    gaps = np.array([])\n",
    "    for optimized,planned in zip(optimized_distances_by_plan,planned_distances_by_plan):\n",
    "        gap = planned - optimized\n",
    "        gaps = np.append(gaps,gap)\n",
    "    total_gap = np.sum(gaps)\n",
    "    total_planned = np.sum(planned_distances_by_plan)\n",
    "    ratio = total_gap / total_planned\n",
    "    return ratio\n",
    "\n",
    "def getClusterJumpRatio(optimized_orders_by_plan, cordinates_list):\n",
    "    gaps = 0\n",
    "    totals = 0\n",
    "    for order, cordinates in zip(optimized_orders_by_plan,cordinates_list):\n",
    "        days = []\n",
    "        for _ in cordinates:\n",
    "            days.append(len(_))\n",
    "        days = np.array(days) - 1 #\n",
    "        #print(days)\n",
    "        optimzied_cluster_count = len(days) #\n",
    "        #print(optimzied_cluster_count)\n",
    "\n",
    "        totalplaces = optimzied_cluster_count + len(order)\n",
    "        #print(totalplaces)\n",
    "        candidates = list(range(totalplaces))\n",
    "        #print(candidates)\n",
    "        \n",
    "        cluster_list = [] #\n",
    "        for cand in candidates:\n",
    "            if cand in order:\n",
    "                index = order.index(cand)\n",
    "                clusterNumber = getcluster(index,days)\n",
    "                cluster_list.append(clusterNumber)\n",
    "        #print(cluster_list)\n",
    "\n",
    "        cluster_set =  makeClusterSet(cluster_list,days)\n",
    "        #print(cluster_set)\n",
    "\n",
    "        cluster_visited_count = 0\n",
    "        for cluster in cluster_set:\n",
    "            cluster_visited_count += len(cluster)\n",
    "        #print(cluster_visited_count)\n",
    "\n",
    "        gaps += cluster_visited_count - optimzied_cluster_count\n",
    "        totals += optimzied_cluster_count\n",
    "    #print(gaps,totals)\n",
    "    return gaps/totals\n",
    "\n",
    "def getcluster(index,days):\n",
    "    clusterNumber = 0\n",
    "    for day in days:\n",
    "        index = index - day\n",
    "        if index < 0:\n",
    "            return clusterNumber\n",
    "        else:\n",
    "            clusterNumber += 1\n",
    "\n",
    "def makeClusterSet(cluster_list,days):\n",
    "    cluster_sets = []\n",
    "    for day in days:\n",
    "        cluster = []\n",
    "        n = day\n",
    "        while n > 0:\n",
    "            cluster.append(cluster_list[0])\n",
    "            cluster_list.pop(0)\n",
    "            n -= 1\n",
    "        cluster_sets.append(set(cluster))\n",
    "    return cluster_sets\n",
    "\n",
    "def planwiseTSP(model, task, numPlan):\n",
    "    optimized_distances_by_plan = []\n",
    "    optimized_orders_by_plan = []\n",
    "    planned_distances_by_plan = []\n",
    "    cordinates_list = []\n",
    "\n",
    "    ave_att_per_day = 0\n",
    "    total_days = 0\n",
    "    total_att = 0\n",
    "\n",
    "    with open(f'Output/{model}/evals/{task}.jsonl', 'r') as f:\n",
    "        plans = [json.loads(line) for line in f]\n",
    "\n",
    "    for i in range(numPlan):\n",
    "        \n",
    "        if i%20 == 0:\n",
    "            print(\"Mode: Plan wise. we are at plan: \", i)\n",
    "        plan = plans[i]['plan'] \n",
    "        \n",
    "        # Failure rate related\n",
    "        # prepare a result list to return\n",
    "        # outofpool, missinginfo,\n",
    "        # prepare the evaluation for each plan, search the business id\n",
    "        plan_eval = prepareEval(plan)\n",
    "        #if(plan_eval)\n",
    "        if plan_eval[0]['accommodation'] == -1 or plan_eval[0]['accommodation'] == -2:\n",
    "            continue\n",
    "        \n",
    "        #get the cordinates\n",
    "        cordinates = populateCordinates(plan_eval, attractions, hotels)\n",
    "        cordinates_list.append(cordinates)\n",
    "        total_days += len(cordinates)\n",
    "        #print(len(cordinates))\n",
    "\n",
    "        distance_matrix = getDistanceMatrix_by_plan(cordinates)\n",
    "        \n",
    "        optimized_distance, info_lists = getOptimizedDistance_by_plan(cordinates,distance_matrix)\n",
    "        \n",
    "        optimized_distances_by_plan.append(optimized_distance)\n",
    "        \n",
    "        optimized_order = getOptimizedOrder_by_plan(info_lists)\n",
    "        #print(optimized_order)\n",
    "        total_att+=len(optimized_order)\n",
    "\n",
    "        optimized_orders_by_plan.append(optimized_order)\n",
    "        \n",
    "\n",
    "        planned_distance = getPlannedDistance_by_plan(cordinates, distance_matrix)\n",
    "        planned_distances_by_plan.append(planned_distance)\n",
    "\n",
    "    distance_gap_ratio_by_plan = getDistanceGapRatio_by_plan(optimized_distances_by_plan, planned_distances_by_plan)\n",
    "    cluster_jump_ratio_by_plan = getClusterJumpRatio(optimized_orders_by_plan, cordinates_list)\n",
    "    ave_att_per_day = total_att / total_days\n",
    "    return distance_gap_ratio_by_plan,cluster_jump_ratio_by_plan,ave_att_per_day\n",
    "\n",
    "def paraacc(log,eval):\n",
    "    #attractions\n",
    "    att_deno = 2\n",
    "    att_num = 2\n",
    "    for step in reversed(log):\n",
    "        if step['state'] == 'Successful':\n",
    "            if \"AttractionSearch\" in step['action']:\n",
    "                full = str(step['action'])\n",
    "                pattern = r'\\[.*\\]'\n",
    "                match = re.search(pattern, full)\n",
    "                if(match):\n",
    "                    preferences = match.group(0).lower()\n",
    "                    #print(preferences)\n",
    "                \n",
    "                pattern2 = r'\\[(.*),\\s*\\[(.*)\\]\\]'\n",
    "                match = re.search(pattern2, preferences)\n",
    "                if match:\n",
    "                    budget = match.group(1).strip()\n",
    "                    pref = match.group(2).strip()\n",
    "                    #print(budget, pref)\n",
    "                    pref_list = pref.split(', ')\n",
    "                    #print(pref_list)\n",
    "                if budget != eval['price'][0].lower():\n",
    "                    att_num -= 1\n",
    "                for p in pref_list:\n",
    "                    if p not in eval['attraction']:\n",
    "                        att_num -= 1\n",
    "\n",
    "    #accommodation\n",
    "    hotel_deno = 0\n",
    "    hotel_num = 0\n",
    "    for step in reversed(log):\n",
    "        if step['state'] == 'Successful':\n",
    "            if \"AccommodationSearch\" in step['action']:\n",
    "                full = str(step['action'])\n",
    "                pattern = r'\\[.*\\]'\n",
    "                match = re.search(pattern, full)\n",
    "                if(match):\n",
    "                    preferences = match.group(0).lower()\n",
    "                    #print(preferences)\n",
    "                \n",
    "                pattern2 = r'\\[(.*),\\s*\\[(.*)\\]\\]'\n",
    "                match = re.search(pattern2, preferences)\n",
    "                if match:\n",
    "                    budget = match.group(1).strip()\n",
    "                    pref = match.group(2).strip()\n",
    "                    #print(budget, pref)\n",
    "                    pref_list = pref.split(', ')\n",
    "                    #print(pref_list)\n",
    "                    hotel_deno = 1 + len(pref_list)\n",
    "                    hotel_num = hotel_deno\n",
    "                    #print(hotel_deno)\n",
    "                if budget != eval['price'][0].lower():\n",
    "                    hotel_num -= 1\n",
    "                for p in pref_list:\n",
    "                    if p not in eval['hotel']:\n",
    "                        hotel_num -= 1\n",
    "\n",
    "    #restaurant\n",
    "    res_deno = 0\n",
    "    res_num = 0\n",
    "    for step in reversed(log):\n",
    "        if step['state'] == 'Successful':\n",
    "            if \"RestaurantSearch\" in step['action']:\n",
    "                full = str(step['action'])\n",
    "                full = 'Action 3: RestaurantSearch[Moderate Budget, Vietnamese, [Good Flavor, Good Value]]'\n",
    "                pattern = r'\\[.*\\]'\n",
    "                match = re.search(pattern, full)\n",
    "                if(match):\n",
    "                    preferences = match.group(0).lower()\n",
    "                    #print(preferences)\n",
    "                \n",
    "                pattern2 = r'\\[(.*),(.*),\\s*\\[(.*)\\]\\]'\n",
    "                match = re.search(pattern2, preferences)\n",
    "                if match:\n",
    "                    budget = match.group(1).strip()\n",
    "                    cuisine = match.group(2).strip()\n",
    "                    pref = match.group(3).strip()\n",
    "                    #print(budget, cuisine, pref)\n",
    "                    pref_list = pref.split(', ')\n",
    "                    #print(pref_list)\n",
    "                    res_deno = 2 + len(pref_list)\n",
    "                    res_num = res_deno\n",
    "                    #print(res_deno)\n",
    "                if budget != eval['price'][0].lower():\n",
    "                    res_num -= 1\n",
    "                if cuisine != eval['cuisine'][0].lower():\n",
    "                    res_num -= 1\n",
    "                for p in pref_list:\n",
    "                    if p not in eval['restaurant']:\n",
    "                        res_num -= 1\n",
    "\n",
    "\n",
    "    \n",
    "    return res_num + att_num + hotel_num , res_deno + att_deno + hotel_deno\n",
    "\n",
    "def getParameterACC(model,numPlan):\n",
    "    allnum = 0\n",
    "    alldeno = 0\n",
    "    with open (f'Output/{model}/plans/toolUseLogs.jsonl', 'r') as f:\n",
    "        logs = [json.loads(line.strip()) for line in f]\n",
    "    with open (f'Prompts/evals.jsonl', 'r') as f:\n",
    "        evals = [json.loads(line.strip()) for line in f]\n",
    "    \n",
    "    for log,eval in zip(logs,evals):\n",
    "        #print(eval['eval_info'])\n",
    "        num,deno = paraacc(log['log'],eval['eval_info'])\n",
    "        allnum += num\n",
    "        alldeno += deno\n",
    "\n",
    "    rate = allnum/alldeno\n",
    "    return rate\n",
    "\n",
    "def getValidRate(model,task,numPlan,passRate):\n",
    "    \n",
    "    with open(f'Output/{model}/evals/{task}.jsonl', 'r') as f:\n",
    "        plans = [json.loads(line) for line in f]\n",
    "\n",
    "    with open(f'Prompts/evals.jsonl', 'r') as f:\n",
    "            evals = [json.loads(line) for line in f]\n",
    "\n",
    "    validated = 0\n",
    "\n",
    "    for i in range(numPlan):\n",
    "        plan = plans[i]['plan']\n",
    "        eval = evals[i]['eval_info']\n",
    "        \n",
    "        # Failure rate related\n",
    "        # prepare a result list to return\n",
    "        # outofpool, missinginfo,\n",
    "        results = []\n",
    "        # prepare the evaluation for each plan, search the business id\n",
    "        plan_eval = prepareEval(plan)\n",
    "\n",
    "\n",
    "        #Failure Rate\n",
    "        outsidepool = evaluate_outSidePool(plan_eval)\n",
    "        results.append(outsidepool)\n",
    "\n",
    "\n",
    "        missingInfo = evaluate_missingInfo(plan_eval)\n",
    "        results.append(missingInfo)\n",
    "        \n",
    "        if results != [0,0]:\n",
    "            continue\n",
    "        \n",
    "        #Preference match\n",
    "        results = []\n",
    "\n",
    "        #day\n",
    "        day_numerator, day_denominator = evaluate_day(plan_eval,eval)\n",
    "        results.append([day_numerator, day_denominator])\n",
    "\n",
    "        #price\n",
    "        price_numerator, price_denominator = evaluate_price(plan_eval,eval)\n",
    "        results.append([price_numerator, price_denominator])\n",
    "\n",
    "        #attraction orientation\n",
    "        attraction_numerator, attraction_denominator = evaluate_attraction_orientation(plan_eval,eval)\n",
    "        results.append([attraction_numerator, attraction_denominator])\n",
    "        \n",
    "        #cuisine\n",
    "        cuisine_numerator, cuisine_denominator = evaluate_cuisine(plan_eval,eval)\n",
    "        results.append([cuisine_numerator, cuisine_denominator])\n",
    "\n",
    "        #restaurants\n",
    "        restaurants_numerator, restaurants_denominator = evaluate_restaurants(plan_eval,eval)\n",
    "        results.append([restaurants_numerator, restaurants_denominator])\n",
    "\n",
    "        #hotels\n",
    "        hotels_numerator, hotels_denominator = evaluate_hotels(plan_eval,eval)\n",
    "        results.append([hotels_numerator, hotels_denominator])\n",
    "\n",
    "        if(getOneMacro(results,passRate)):\n",
    "            validated += 1\n",
    "            \n",
    "\n",
    "\n",
    "    return validated/numPlan\n",
    "\n",
    "def getOneMacro(results,passRate):\n",
    "    #print(results) #[[1, 1], [11, 16], [8, 8], [4, 6], [10, 12], [4, 4]]\n",
    "\n",
    "    for cat in results:\n",
    "        #print(cat)\n",
    "        if cat[0] == cat[1] == 0:\n",
    "            continue\n",
    "        \n",
    "        if cat[0] / cat[1] < passRate:\n",
    "            return False\n",
    "\n",
    "    return True\n",
    "\n",
    "def getRatio(failure_list, preference_list, passRate):\n",
    "    result = []\n",
    "    OOP = failure_list[0][0]\n",
    "    MI  = failure_list[0][1]\n",
    "    Day = preference_list[0][0]\n",
    "    Price = preference_list[0][1]\n",
    "    Attraction = preference_list[0][2]\n",
    "    Cuisine = preference_list[0][3]\n",
    "    Restaurant = preference_list[0][4]\n",
    "    Hotel = preference_list[0][5]\n",
    "    #print(OOP,MI,Day,Price,Attraction,Cuisine,Restaurant,Hotel)\n",
    "    \n",
    "    if OOP > 0:\n",
    "        result.append(1)\n",
    "    else:\n",
    "        result.append(0)\n",
    "\n",
    "    if MI > 0:\n",
    "        result.append(1)\n",
    "    else:\n",
    "        result.append(0)\n",
    "        \n",
    "    if Day[0]/Day[1] < passRate:\n",
    "        result.append(1)\n",
    "    else:\n",
    "        result.append(0)\n",
    "    \n",
    "    if Price[0]/Price[1] < passRate:\n",
    "        result.append(1)\n",
    "    else:\n",
    "        result.append(0)\n",
    "\n",
    "    if Attraction[0]/Attraction[1] < passRate:\n",
    "        result.append(1)\n",
    "    else:\n",
    "        result.append(0) \n",
    "\n",
    "    if Cuisine[0]/Cuisine[1] < passRate:\n",
    "        result.append(1)\n",
    "    else:\n",
    "        result.append(0)\n",
    "\n",
    "    if Restaurant[0]/Restaurant[1] < passRate:\n",
    "        result.append(1)\n",
    "    else:\n",
    "        result.append(0)\n",
    "\n",
    "    if Hotel[0]/Hotel[1] < passRate:\n",
    "        result.append(1)\n",
    "    else:\n",
    "        result.append(0)\n",
    "\n",
    "    return result\n",
    "\n",
    "if __name__ == \"__main__\":\n",
    "    #load datas\n",
    "    with open ('Dataset/gpt4o/restaurants.jsonl', 'r') as file:\n",
    "        restaurants = [json.loads(line.strip()) for line in file]\n",
    "\n",
    "    with open ('Dataset/gpt4o/hotels.jsonl', 'r') as file:\n",
    "        hotels = [json.loads(line.strip()) for line in file]\n",
    "\n",
    "    with open ('Dataset/gpt4o/attractions.jsonl', 'r') as file:\n",
    "        attractions = [json.loads(line.strip()) for line in file]\n",
    "\n",
    "    modelList = ['gpt4o','mistral','llama318b']\n",
    "    taskList = ['allDataNoRoute','allDataRouteOP','filteredDataRouteOP','toolUsePlans','baseData']\n",
    "\n",
    "    #choose model and task\n",
    "    model = modelList[0]\n",
    "    task = taskList[2]\n",
    "    print(\"==Model: \", model,\"==\")\n",
    "    print(\"==Task: \", task,\"==\")\n",
    "     \n",
    "    #failure and preference\n",
    "    numPlan = 200\n",
    "    wrongLists = []\n",
    "    for i in range(numPlan):\n",
    "        planIndex = i\n",
    "        passRate = 0.75\n",
    "        failure_list, preference_list = getFailureAndPreferenceList(model,task,planIndex)\n",
    "        wrongList = getRatio(failure_list, preference_list,passRate)\n",
    "        wrongLists.append(wrongList)\n",
    "    \n",
    "    result = [sum(col) for col in zip(*wrongLists)]\n",
    "    result_normalized = [x/sum(result) for x in result]\n",
    "    print(result_normalized)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "torchgpu",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.11"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
