{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 81,
   "metadata": {},
   "outputs": [
    {
     "ename": "ValueError",
     "evalue": "'a' cannot be empty unless no samples are taken",
     "output_type": "error",
     "traceback": [
      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[1;31mValueError\u001b[0m                                Traceback (most recent call last)",
      "Cell \u001b[1;32mIn[81], line 174\u001b[0m\n\u001b[0;32m    172\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m    173\u001b[0m     allow_replace \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mFalse\u001b[39;00m\n\u001b[1;32m--> 174\u001b[0m res_finals \u001b[38;5;241m=\u001b[39m np\u001b[38;5;241m.\u001b[39mrandom\u001b[38;5;241m.\u001b[39mchoice(res_cands, size\u001b[38;5;241m=\u001b[39mresNumber, replace\u001b[38;5;241m=\u001b[39mallow_replace)\n\u001b[0;32m    175\u001b[0m att_finals \u001b[38;5;241m=\u001b[39m np\u001b[38;5;241m.\u001b[39mrandom\u001b[38;5;241m.\u001b[39mchoice(att_cands, size\u001b[38;5;241m=\u001b[39mattNumber, replace\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mFalse\u001b[39;00m)\n\u001b[0;32m    176\u001b[0m hotel_finals \u001b[38;5;241m=\u001b[39m np\u001b[38;5;241m.\u001b[39mrandom\u001b[38;5;241m.\u001b[39mchoice(hotel_cands, size\u001b[38;5;241m=\u001b[39mhotelNumber, replace\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mFalse\u001b[39;00m)\n",
      "File \u001b[1;32mnumpy\\\\random\\\\mtrand.pyx:951\u001b[0m, in \u001b[0;36mnumpy.random.mtrand.RandomState.choice\u001b[1;34m()\u001b[0m\n",
      "\u001b[1;31mValueError\u001b[0m: 'a' cannot be empty unless no samples are taken"
     ]
    }
   ],
   "source": [
    "import json\n",
    "import numpy as np\n",
    "\n",
    "\n",
    "def getRequirements(requirements):\n",
    "    day = requirements['day']\n",
    "    price = requirements['price']\n",
    "    attraction = requirements['attraction']\n",
    "    cuisine = requirements['cuisine']\n",
    "    restaurant = requirements['restaurant']\n",
    "    hotel = requirements['hotel']\n",
    "    return day, price, attraction, cuisine, restaurant,hotel\n",
    "\n",
    "def mapBudget(price):\n",
    "    if price[0] == 'expensive budget':\n",
    "        return ['$$','$$$','$$$$']\n",
    "    if price[0] == 'moderate budget':\n",
    "        return ['$','$$','$$$']\n",
    "    if price[0] == 'cheap budget':\n",
    "        return ['$','$$']\n",
    "\n",
    "def mapRes(restaurant):\n",
    "    #['good freshness', 'good environment']\n",
    "    limits = []\n",
    "    for lim in restaurant:\n",
    "        limits.append(lim.split(' ')[1])\n",
    "    return limits\n",
    "\n",
    "def getResList(price, cuisine, restaurant, restaurants):\n",
    "    res_cands = []\n",
    "    price_limit = mapBudget(price)\n",
    "    res_limit = mapRes(restaurant)\n",
    "\n",
    "    if cuisine == ['US']:\n",
    "        cuisine = ['American','American (New)','American (Traditional)']\n",
    "    for res in restaurants:\n",
    "        if res['price'] != None and res['price'] in price_limit:\n",
    "            if res['cuisine_1'] in cuisine or res['cuisine_2'] in cuisine:\n",
    "                for lim in res_limit:\n",
    "                    if (res[lim] == 'good '+ lim) or (res[lim] == 'excellent ' + lim):\n",
    "                        res_cands.append(res)\n",
    "    return res_cands\n",
    "\n",
    "def getAttList(price, attraction, attractions):\n",
    "    att_cands = []\n",
    "    price_limit = mapBudget(price)\n",
    "    for att in attractions:\n",
    "        if att['price'] in price_limit:\n",
    "            if att[attraction[0]] == 'medium ' + attraction[0] or att[attraction[0]] == 'high ' + attraction[0]:\n",
    "                att_cands.append(att)\n",
    "            #if att[attraction]\n",
    "    return att_cands\n",
    "\n",
    "def mapHot(hotel):\n",
    "    limits = []\n",
    "    for lim in hotel:\n",
    "        limits.append(lim.split(' ')[1])\n",
    "    return limits\n",
    "\n",
    "def getHotelList(price, hotel, hotels):\n",
    "    hotel_cands = []\n",
    "    price_limit = mapBudget(price)\n",
    "    hotel_limit = mapHot(hotel)\n",
    "    for hot in hotels:\n",
    "        if hot['price'] in price_limit:\n",
    "            for lim in hotel_limit:\n",
    "                if (hot[lim] == 'good '+ lim) or (hot[lim] == 'excellent ' + lim):\n",
    "                    hotel_cands.append(hot)\n",
    "    return hotel_cands\n",
    "\n",
    "def euclidean_distance(coord1, coord2):\n",
    "    return ((coord1[0] - coord2[0]) ** 2 + (coord1[1] - coord2[1]) ** 2) ** 0.5\n",
    "\n",
    "def arrangeRoute(day, att_finals, hotel_finals):\n",
    "    att_cords = []\n",
    "    hotel_cords = []\n",
    "\n",
    "    for i in att_finals:\n",
    "        att_cords.append([i['latitude'],i['longitude']])\n",
    "    for i in hotel_finals:\n",
    "        hotel_cords.append([i['latitude'],i['longitude']])\n",
    "\n",
    "    orders = naive_route(day, att_cords, hotel_cords)\n",
    "    orders = np.array(orders).flatten()\n",
    "    att_order = []\n",
    "    for o in orders:\n",
    "        att_order.append(att_finals[o])\n",
    "    return att_order\n",
    "\n",
    "def naive_route(days, att_coords, hotel_coords):\n",
    "    if len(att_coords) < days * 4:\n",
    "        raise ValueError(\"Not enough attractions to cover all days\")\n",
    "    \n",
    "    hotel = tuple(hotel_coords[0])\n",
    "    remaining_indices = set(range(len(att_coords)))\n",
    "    full_plan = []\n",
    "    \n",
    "    for _ in range(days):\n",
    "        if len(remaining_indices) < 4:\n",
    "            break\n",
    "        \n",
    "        # Start from the closest attraction to the hotel\n",
    "        first_index = min(remaining_indices, key=lambda i: euclidean_distance(hotel, att_coords[i]))\n",
    "        day_route = [first_index]\n",
    "        remaining_indices.remove(first_index)\n",
    "        \n",
    "        # Greedily choose the next closest attractions\n",
    "        current_index = first_index\n",
    "        for _ in range(3):  # Visit 4 attractions in total\n",
    "            next_index = min(remaining_indices, key=lambda i: euclidean_distance(att_coords[current_index], att_coords[i]))\n",
    "            day_route.append(next_index)\n",
    "            remaining_indices.remove(next_index)\n",
    "            current_index = next_index\n",
    "        \n",
    "        full_plan.append(day_route)\n",
    "    \n",
    "    return full_plan\n",
    "\n",
    "def parseEval(res_info, att_info, hotel_info):\n",
    "    itinerary = []\n",
    "    \n",
    "    # Ensure there's enough data for at least one day\n",
    "    days = min(len(res_info) // 3, len(att_info) // 4)\n",
    "    \n",
    "    for i in range(days):\n",
    "        day_plan = {\n",
    "            \"days\": str(i + 1),\n",
    "            \"breakfast\": {\"name\": res_info[i * 3][0], \"address\": res_info[i * 3][1]},\n",
    "            \"morning_attractions\": [{\"name\": att_info[i * 4][0], \"address\": att_info[i * 4][1]}],\n",
    "            \"lunch\": {\"name\": res_info[i * 3 + 1][0], \"address\": res_info[i * 3 + 1][1]},\n",
    "            \"afternoon_attractions\": [\n",
    "                {\"name\": att_info[i * 4 + 1][0], \"address\": att_info[i * 4 + 1][1]},\n",
    "                {\"name\": att_info[i * 4 + 2][0], \"address\": att_info[i * 4 + 2][1]}\n",
    "            ],\n",
    "            \"dinner\": {\"name\": res_info[i * 3 + 2][0], \"address\": res_info[i * 3 + 2][1]},\n",
    "            \"night_attractions\": [{\"name\": att_info[i * 4 + 3][0], \"address\": att_info[i * 4 + 3][1]}],\n",
    "            \"accommodation\": {\"name\": hotel_info[0][0], \"address\": hotel_info[0][1]}\n",
    "        }\n",
    "        itinerary.append(day_plan)\n",
    "    \n",
    "    return {\"index\": 1, \"plan\": {\"itinerary\": itinerary}}\n",
    "\n",
    "\n",
    "with open('Prompts/evals.jsonl', 'r') as f:\n",
    "    evals = [json.loads(line.strip()) for line in f]\n",
    "\n",
    "with open ('Dataset/gpt4o/attractions.jsonl', 'r') as f:\n",
    "    attractions = [json.loads(line.strip()) for line in f]\n",
    "\n",
    "with open('Dataset/gpt4o/hotels.jsonl', 'r') as f:\n",
    "    hotels = [json.loads(line.strip()) for line in f]\n",
    "\n",
    "with open('Dataset/gpt4o/restaurants.jsonl', 'r') as f:\n",
    "    restaurants = [json.loads(line.strip()) for line in f]\n",
    "\n",
    "numPlan = 100\n",
    "\n",
    "for i in range(numPlan):\n",
    "    requirements = evals[i]['eval_info']\n",
    "    day, price, attraction, cuisine, restaurant,hotel = getRequirements(requirements)\n",
    "\n",
    "    res_cands = getResList(price, cuisine, restaurant,restaurants)\n",
    "    att_cands = getAttList(price, attraction,attractions)\n",
    "    hotel_cands = getHotelList(price, hotel,hotels)\n",
    "\n",
    "    resNumber = int(day[0][0]) * 3\n",
    "    attNumber = int(day[0][0]) * 4\n",
    "    hotelNumber = 1\n",
    "    #random select from candidates\n",
    "    if(resNumber > len(res_cands)):\n",
    "        allow_replace = True\n",
    "    else:\n",
    "        allow_replace = False\n",
    "    res_finals = np.random.choice(res_cands, size=resNumber, replace=allow_replace)\n",
    "    att_finals = np.random.choice(att_cands, size=attNumber, replace=False)\n",
    "    hotel_finals = np.random.choice(hotel_cands, size=hotelNumber, replace=False)\n",
    "    \n",
    "    #get the route calculated naively\n",
    "    attOrder = arrangeRoute(int(day[0][0]),att_finals, hotel_finals)\n",
    "\n",
    "    res_info = [[i['name'],i['address']] for i in res_finals]\n",
    "    att_info = [[i['name'],i['address']] for i in attOrder]\n",
    "    hotel_info = [[i['name'],i['address']] for i in hotel_finals]\n",
    "    \n",
    "    parsed_eval = parseEval(res_info, att_info, hotel_info)\n",
    "\n",
    "    with open('Output/greedy/evals/filteredDataRouteOP.jsonl', 'a') as f:\n",
    "        f.write(json.dumps(parsed_eval) + '\\n')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# cuisine like Irish cannot be satisfied.\n",
    "# there's something wrong with the plan generator\n",
    "#there is something wrong with the actual evaluation"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "torchgpu",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.0"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
