{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 86,
   "id": "1d0e8c96-9e0b-418f-972c-e188bc055248",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pickle\n",
    "\n",
    "for data in ['bank77', 'clinic', 'goemo' , 'massive_I', 'massive_D']:\n",
    "    results_dict = {}\n",
    "\n",
    "    for emb_type in ['distilbert', 'sbert', 'openai', 'e5-large']:\n",
    "        # Open the pickle file in read-binary mode\n",
    "        with open(\"sims_offline_results_\" + emb_type + \"_\" + data + \".pkl\", \"rb\") as file:\n",
    "            cur_results = pickle.load(file)\n",
    "        results_dict[emb_type] = cur_results[emb_type]\n",
    "        \n",
    "    for llm_type in ['gpt-3.5-turbo','llama3.3-70b','deepseek-chat','claude-3-7-sonnet-20250219']:\n",
    "\n",
    "        try:\n",
    "            # Open the pickle file in read-binary mode\n",
    "            with open(\"sims_offline_results_\" + llm_type + \"_\" + data + \".pkl\", \"rb\") as file:\n",
    "                cur_results = pickle.load(file)\n",
    "            \n",
    "            results_dict[llm_type] = cur_results\n",
    "        except:\n",
    "            continue\n",
    "\n",
    "    for nlp_type in ['textrank','centroid','lsa']:\n",
    "\n",
    "        try:\n",
    "            # Open the pickle file in read-binary mode\n",
    "            with open(\"sims_offline_results_nlp_\" + nlp_type + '_' + data + \".pkl\", \"rb\") as file:\n",
    "                cur_results = pickle.load(file)\n",
    "            \n",
    "            results_dict[nlp_type] = cur_results\n",
    "        except:\n",
    "            continue\n",
    "\n",
    "    # Open the pickle file in read-binary mode\n",
    "    with open(\"sims_offline_results_traditional_clustering_\" + data + \".pkl\", \"rb\") as file:\n",
    "        cur_results = pickle.load(file)\n",
    "\n",
    "    for emb_type in ['distilbert', 'sbert', 'openai', 'e5-large']:\n",
    "        results_dict[emb_type]['GMM'] = cur_results[emb_type]['GMM']\n",
    "        results_dict[emb_type]['Agglomerative'] = cur_results[emb_type]['Agglomerative']\n",
    "        results_dict[emb_type]['Spectral'] = cur_results[emb_type]['Spectral']\n",
    "        \n",
    "    with open(\"results_\" + data + \".pkl\", \"wb\") as f:\n",
    "        pickle.dump(results_dict, f)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "bbcf9a87-233c-42b0-818d-5fa101f57d0f",
   "metadata": {},
   "outputs": [],
   "source": [
    "results_llms = {\n",
    "    'Instructor': {\n",
    "        'clinic': {'ACC': 79.29, 'NMI': 92.60},\n",
    "        'MTOP(I)': {'ACC': 33.35, 'NMI': 70.63},\n",
    "        'massive_I': {'ACC': 54.08, 'NMI': 73.42},\n",
    "        'goemo': {'ACC': 25.19, 'NMI': 21.54},\n",
    "        'CLINC(D)': {'ACC': 52.50, 'NMI': 56.87},\n",
    "        'MTOP(D)': {'ACC': 90.56, 'NMI': 87.30},\n",
    "        'massive_D': {'ACC': 61.81, 'NMI': 67.31},\n",
    "    },\n",
    "    'SCCL': {\n",
    "        'clinic': {'ACC': 80.85, 'NMI': 92.94},\n",
    "        'MTOP(I)': {'ACC': 34.28, 'NMI': 73.52},\n",
    "        'massive_I': {'ACC': 54.10, 'NMI': 73.90},\n",
    "        'goemo': {'ACC': 34.33, 'NMI': 30.54},\n",
    "        'CLINC(D)': {'ACC': 54.22, 'NMI': 60.88},\n",
    "        'MTOP(D)': {'ACC': 89.08, 'NMI': 84.77},\n",
    "        'massive_D': {'ACC': 61.34, 'NMI': 68.69},\n",
    "    },\n",
    "    'Self-supervise-I': {\n",
    "        'clinic': {'ACC': 80.82, 'NMI': 93.88},\n",
    "        'MTOP(I)': {'ACC': 34.06, 'NMI': 72.50},\n",
    "        'massive_I': {'ACC': 55.07, 'NMI': 72.88},\n",
    "        'goemo': {'ACC': 24.11, 'NMI': 22.05},\n",
    "        'CLINC(D)': {'ACC': 58.58, 'NMI': 60.84},\n",
    "        'MTOP(D)': {'ACC': 92.12, 'NMI': 88.49},\n",
    "        'massive_D': {'ACC': 53.97, 'NMI': 71.53},\n",
    "    },\n",
    "    'ClusterLLM-I': {\n",
    "        'clinic': {'ACC': 82.77, 'NMI': 93.88},\n",
    "        'MTOP(I)': {'ACC': 35.84, 'NMI': 73.52},\n",
    "        'massive_I': {'ACC': 59.89, 'NMI': 76.96},\n",
    "        'goemo': {'ACC': 27.49, 'NMI': 24.78},\n",
    "        'CLINC(D)': {'ACC': 53.49, 'NMI': 59.98},\n",
    "        'MTOP(D)': {'ACC': 93.53, 'NMI': 89.36},\n",
    "        'massive_D': {'ACC': 61.06, 'NMI': 68.62},\n",
    "    },\n",
    "    'ClusterLLM': {\n",
    "        'clinic': {'ACC': 83.8, 'NMI': 94.0, 'Queries':1618},\n",
    "        'MTOP(I)': {'ACC': 35.0, 'NMI': 73.83, 'Queries':1618},\n",
    "        'massive_I': {'ACC': 60.7, 'NMI': 77.64, 'Queries':1618},\n",
    "        'goemo': {'ACC': 26.8, 'NMI': 23.9, 'Queries':1618},\n",
    "        'CLINC(D)': {'ACC': 51.82, 'NMI': 54.81, 'Queries':1618},\n",
    "        'MTOP(D)': {'ACC': 92.13, 'NMI': 89.23, 'Queries':1618},\n",
    "        'massive_D': {'ACC': 60.9, 'NMI': 68.8, 'Queries':1618},\n",
    "    },\n",
    "    'IDAS': {\n",
    "        'clinic': {'ACC': 81.4, 'NMI': 92.4, 'Queries':4650},\n",
    "        'MTOP(I)': {'ACC': 37.30, 'NMI': 72.31},\n",
    "        'massive_I': {'ACC': 63.01, 'NMI': 75.74,'Queries':3033},\n",
    "        'goemo': {'ACC': 30.6, 'NMI': 25.6, 'Queries':3011},\n",
    "        'CLINC(D)': {'ACC': 54.18, 'NMI': 63.82},\n",
    "        'MTOP(D)': {'ACC': 87.57, 'NMI': 87.30},\n",
    "        'massive_D': {'ACC': 53.5, 'NMI': 63.9, 'Queries':2992},\n",
    "    },\n",
    "    'LLMEdgeRefine': {\n",
    "        'clinic': {'ACC': 86.8, 'NMI': 94.9, 'Queries': 1350},\n",
    "        'MTOP(I)': {'ACC': 46.00, 'NMI': 72.92},\n",
    "        'massive_I': {'ACC': 63.42, 'NMI': 76.66, 'Queries': 892},\n",
    "        'goemo': {'ACC': 34.8, 'NMI': 29.7, 'Queries': 895},\n",
    "        'CLINC(D)': {'ACC': 59.40, 'NMI': 61.27},\n",
    "        'MTOP(D)': {'ACC': 92.8, 'NMI': 88.1},\n",
    "        'massive_D': {'ACC': 63.05, 'NMI': 68.67, 'Queries': 892},\n",
    "    },\n",
    "}\n",
    "\n",
    "queries = {'clinic':750,\n",
    "           'goemo':135,\n",
    "           'massive_D':90,\n",
    "           'massive_I':295}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 76,
   "id": "c9c95a59-7633-459d-bd73-c9b8f0c7ea01",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import pickle\n",
    "results_summary = {}\n",
    "results_summary_std = {}\n",
    "\n",
    "for data in ['bank77', 'clinic', 'goemo' , 'massive_I', 'massive_D']:\n",
    "    results_summary[data] = {}\n",
    "    results_summary_std[data] = {}\n",
    "    \n",
    "    with open(\"results_\" + data + \".pkl\", \"rb\") as file:\n",
    "        results_dict = pickle.load(file)\n",
    "\n",
    "    #get gpt-4o original results multiple embeddings\n",
    "    llm_type = 'gpt-4o'\n",
    "    results_summary[data][llm_type] = {}\n",
    "    results_summary_std[data][llm_type] = {}\n",
    "    \n",
    "    for emb_type in ['distilbert', 'openai','e5-large', 'sbert']:\n",
    "        results_summary[data][llm_type][emb_type] = {}\n",
    "        results_summary_std[data][llm_type][emb_type] = {}\n",
    "        \n",
    "        for i in ['kmeans','kmedoids']:\n",
    "            acc = []\n",
    "            nmi = []\n",
    "            cen = []\n",
    "            for seed in range(10):\n",
    "                cur_results = results_dict[emb_type][seed][i]['results']\n",
    "                acc.append(cur_results[0])\n",
    "                nmi.append(cur_results[1])\n",
    "                cen.append(cur_results[2])\n",
    "            acc = np.array(acc)\n",
    "            nmi = np.array(nmi)\n",
    "            cen = np.array(cen)    \n",
    "            results_summary[data][llm_type][emb_type][i] = list(np.round([100*np.mean(acc), 100*np.mean(nmi)],1)) + [np.round(np.mean(cen),3)]\n",
    "            results_summary_std[data][llm_type][emb_type][i] = list(np.round([np.std(100*acc), np.std(100*nmi)],2)) + [np.round(np.std(cen),3)]\n",
    "    \n",
    "        for force in [0, 10]:\n",
    "            for niter in [1,5]:\n",
    "                acc = []\n",
    "                nmi = []\n",
    "                cen = []\n",
    "                for seed in range(10):\n",
    "                    cur_results = results_dict[emb_type][seed][force][niter]['results']\n",
    "                    acc.append(cur_results[0])\n",
    "                    nmi.append(cur_results[1])\n",
    "                    cen.append(cur_results[2])\n",
    "                acc = np.array(acc)\n",
    "                nmi = np.array(nmi)\n",
    "                cen = np.array(cen)\n",
    "                results_summary[data][llm_type][emb_type][str(force) + '-' + str(niter)] = list(np.round([100*np.mean(acc), 100*np.mean(nmi)],1)) + [np.round(np.mean(cen),3)]\n",
    "                results_summary_std[data][llm_type][emb_type][str(force) + '-' + str(niter)] = list(np.round([np.std(100*acc), np.std(100*nmi)],2)) + [np.round(np.std(cen),3)]\n",
    "    \n",
    "    #get multiple LLMs results with e5-large\n",
    "    emb_type = 'e5-large'\n",
    "    force = 10\n",
    "    niter = 5\n",
    "    for llm_type in ['gpt-3.5-turbo','llama3.3-70b','deepseek-chat','claude-3-7-sonnet-20250219']:\n",
    "        if data=='bank77' and llm_type=='gpt-3.5-turbo':\n",
    "            continue\n",
    "        if data=='massive_I' and llm_type=='gpt-3.5-turbo':\n",
    "            continue\n",
    "        results_summary[data][llm_type] = {}\n",
    "        results_summary[data][llm_type][emb_type] = {}\n",
    "        results_summary_std[data][llm_type] = {}\n",
    "        results_summary_std[data][llm_type][emb_type] = {}\n",
    "        acc = []\n",
    "        nmi = []\n",
    "        cen = []\n",
    "        for seed in range(5):\n",
    "            cur_results = results_dict[llm_type][seed][force][niter]['results']\n",
    "            acc.append(cur_results[0])\n",
    "            nmi.append(cur_results[1])\n",
    "            cen.append(cur_results[2])\n",
    "        acc = np.array(acc)\n",
    "        nmi = np.array(nmi)\n",
    "        cen = np.array(cen)\n",
    "        results_summary[data][llm_type][emb_type][str(force) + '-' + str(niter)] = list(np.round([100*np.mean(acc), 100*np.mean(nmi)],1)) + [np.round(np.mean(cen),3)]\n",
    "        results_summary_std[data][llm_type][emb_type][str(force) + '-' + str(niter)] = list(np.round([np.std(100*acc), np.std(100*nmi)],2)) + [np.round(np.std(cen),3)]\n",
    "\n",
    "    #get multiple NLP results with all embeddings\n",
    "    \n",
    "    for nlp_type in ['textrank','centroid','lsa']:\n",
    "        results_summary[data][nlp_type] = {}\n",
    "        results_summary_std[data][nlp_type] = {}\n",
    "        \n",
    "        for emb_type in ['distilbert', 'openai','e5-large', 'sbert']:\n",
    "            \n",
    "            results_summary[data][nlp_type][emb_type] = {}\n",
    "            results_summary_std[data][nlp_type][emb_type] = {}\n",
    "\n",
    "            \n",
    "            for top_k in [5, 10]:\n",
    "                for niter in [1,5]:\n",
    "\n",
    "                    acc = []\n",
    "                    nmi = []\n",
    "                    cen = []\n",
    "                    for seed in range(5):\n",
    "                        try:\n",
    "                            cur_results = results_dict[emb_type][seed][nlp_type][top_k][niter]['results']\n",
    "                        except:\n",
    "                            continue\n",
    "                        acc.append(cur_results[0])\n",
    "                        nmi.append(cur_results[1])\n",
    "                        cen.append(cur_results[2])\n",
    "\n",
    "                    acc = np.array(acc)\n",
    "                    nmi = np.array(nmi)\n",
    "                    cen = np.array(cen)\n",
    "                    results_summary[data][nlp_type][emb_type][str(top_k) + '-' + str(niter)] = list(np.round([100*np.mean(acc), 100*np.mean(nmi)],1)) + [np.round(np.mean(cen),3)]\n",
    "                    results_summary_std[data][nlp_type][emb_type][str(top_k) + '-' + str(niter)] = list(np.round([np.std(100*acc), np.std(100*nmi)],2)) + [np.round(np.std(cen),3)]\n",
    "    \n",
    "    for method in ['GMM','Agglomerative','Spectral']:\n",
    "        results_summary[data][method] = {}\n",
    "        results_summary_std[data][method] = {}\n",
    "        for emb_type in ['distilbert', 'openai','e5-large', 'sbert']:\n",
    "            \n",
    "            results_summary[data][method][emb_type] = {}\n",
    "            results_summary_std[data][method][emb_type] = {}\n",
    "            acc = []\n",
    "            nmi = []\n",
    "            cen = []\n",
    "            for seed in range(10):\n",
    "                cur_results = results_dict[emb_type][method]['results']\n",
    "                acc.append(cur_results[0])\n",
    "                nmi.append(cur_results[1])\n",
    "                cen.append(cur_results[2])\n",
    "            acc = np.array(acc)\n",
    "            nmi = np.array(nmi)\n",
    "            cen = np.array(cen)\n",
    "            results_summary[data][method][emb_type] = list(np.round([100*np.mean(acc), 100*np.mean(nmi)],1)) + [np.round(np.mean(cen),3)]\n",
    "            results_summary_std[data][method][emb_type] = list(np.round([np.std(100*acc), np.std(100*nmi)],2)) + [np.round(np.std(cen),3)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 84,
   "id": "7ab6242f-dd9a-4972-ab8f-285fa7a0c878",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'assignments': array([ 0, 11,  8, ..., 12, 12, 12]),\n",
       " 'results': [0.5907868190988568,\n",
       "  0.6358152784037107,\n",
       "  0.3624605336149584,\n",
       "  0.3624605336149584,\n",
       "  0.3624605336149584,\n",
       "  0.3624605336149584]}"
      ]
     },
     "execution_count": 84,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "results_dict[emb_type][method]"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "f3e4987c-96a9-4eec-8dff-6d57b1b4417e",
   "metadata": {},
   "source": [
    "# Table including e5-large k-llmmenans-FS5 with multiple LLMs and other clustering"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 71,
   "id": "ccb9d65b-c981-4257-a08c-f70e7a71b440",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "k-LLMmeans &&&&&&&&&&&&\\\\\n",
      "\\quad \\emph{GPT-3.5}&{\\bf 750}&76.0&92.1&&{\\bf 135}&23.9&24.1&&{\\bf 90}&{\\bf 63.3}&66.2\\\\\n",
      "&&(1.16)&(0.28)&&&(0.65)&(0.39)&&&(1.47)&(0.62)\\\\\n",
      "\\quad \\emph{GPT-4o}&{\\bf 750}&77.2&92.5&&{\\bf 135}&24.2&24.3&&{\\bf 90}&62.3&65.9\\\\\n",
      "&&(1.6)&(0.4)&&&(0.76)&(0.7)&&&(1.36)&(0.78)\\\\\n",
      "\\quad \\emph{Llama-3.3}&{\\bf 750}&77.2&92.3&&{\\bf 135}&23.8&23.1&&{\\bf 90}&62.0&66.3\\\\\n",
      "&&(1.6)&(0.44)&&&(0.66)&(0.62)&&&(2.97)&(1.56)\\\\\n",
      "\\quad \\emph{DeepSeek-V3}&{\\bf 750}&69.7&90.8&&{\\bf 135}&22.8&22.7&&{\\bf 90}&62.6&66.3\\\\\n",
      "&&(1.02)&(0.29)&&&(1.68)&(0.88)&&&(2.24)&(0.71)\\\\\n",
      "\\quad \\emph{Claude-3.7}&{\\bf 750}&76.9&92.5&&{\\bf 135}&24.2&23.7&&{\\bf 90}&61.8&66.0\\\\\n",
      "&&(1.83)&(0.52)&&&(1.0)&(0.65)&&&(4.83)&(1.99)\\\\\n",
      "\\hline\n",
      "ClusterLLM&1618&83.8&94.0&&1618&26.8&23.9&&1618&60.9&{\\bf 68.8}\\\\\n",
      "IDAS&4650&81.4&92.4&&3011&30.6&25.6&&2992&53.5&63.9\\\\\n",
      "LLMEdgeRefine&1350&{\\bf 86.8}&{\\bf 94.9}&&895&{\\bf 34.8}&{\\bf 29.7}&&892&63.05&68.67\\\\\n",
      "\n"
     ]
    }
   ],
   "source": [
    "line = {}\n",
    "line_std = {}\n",
    "emb_type = 'e5-large'\n",
    "\n",
    "for data in ['clinic', 'goemo' , 'massive_D']:\n",
    "    prompts = []\n",
    "    acc = []\n",
    "    nmi = []\n",
    "\n",
    "    acc_std = []\n",
    "    nmi_std = []\n",
    "    \n",
    "    method_names = [] \n",
    "    \n",
    "    for llm_type in ['gpt-3.5-turbo','gpt-4o','llama3.3-70b','deepseek-chat','claude-3-7-sonnet-20250219']:\n",
    "\n",
    "        method = '10-5'\n",
    "      \n",
    "        cur_results = results_summary[data][llm_type][emb_type][method]\n",
    "        acc.append(cur_results[0])\n",
    "        nmi.append(cur_results[1])\n",
    "        prompts.append(queries[data])\n",
    "\n",
    "        cur_results_std = results_summary_std[data][llm_type][emb_type][method]\n",
    "        acc_std.append(cur_results_std[0])\n",
    "        nmi_std.append(cur_results_std[1])\n",
    "\n",
    "        if llm_type == 'llama3.3-70b':\n",
    "            llm = 'Llama-3.3'\n",
    "        elif llm_type == 'gpt-3.5-turbo':\n",
    "            llm = 'GPT-3.5'\n",
    "        elif llm_type == 'gpt-4o':\n",
    "            llm = 'GPT-4o'\n",
    "        elif llm_type == 'deepseek-chat':\n",
    "            llm = 'DeepSeek-V3'\n",
    "        elif llm_type == 'claude-3-7-sonnet-20250219':\n",
    "            llm = 'Claude-3.7'\n",
    "        method_names.append('\\\\quad \\\\emph{' + llm + '}')\n",
    "\n",
    "    # Find the maximum value\n",
    "    #val = max(acc)\n",
    "    #acc = [\"\\\\emph{{\\\\bf \"+str(x)+\"}}\" if x == val else x for x in acc]\n",
    "\n",
    "    #val = max(nmi)\n",
    "    #nmi = [\"\\\\emph{{\\\\bf\"+str(x)+\"}}\" if x == val else x for x in nmi]\n",
    "\n",
    "    val = max(prompts)\n",
    "    prompts =  [f\"{{\\\\bf {x}}}\" if x == val else x for x in prompts]\n",
    "\n",
    "    acc_llms = []\n",
    "    nmi_llms = []\n",
    "    prompts_llms = []\n",
    "\n",
    "    for other_method in ['ClusterLLM','IDAS','LLMEdgeRefine']:\n",
    "        \n",
    "        acc_llms.append(results_llms[other_method][data]['ACC'])\n",
    "        nmi_llms.append(results_llms[other_method][data]['NMI'])\n",
    "        prompts_llms.append(results_llms[other_method][data]['Queries'])\n",
    "        \n",
    "        method_names.append(other_method)\n",
    "\n",
    "    acc = acc + acc_llms\n",
    "    nmi = nmi + nmi_llms\n",
    "    prompts = prompts + prompts_llms \n",
    "    \n",
    "    # Find the maximum value\n",
    "    val = max(acc)\n",
    "    acc = [f\"{{\\\\bf {x}}}\" if x == val else x for x in acc]\n",
    "\n",
    "    val = max(nmi)\n",
    "    nmi = [f\"{{\\\\bf {x}}}\" if x == val else x for x in nmi]\n",
    "\n",
    "\n",
    "    \n",
    "    for ii in range(len(method_names)):\n",
    "        cur_method = method_names[ii]\n",
    "        if data == 'clinic':\n",
    "            line[cur_method] = cur_method + '&' + str(prompts[ii]) + '&' + str(acc[ii]) + '&' + str(nmi[ii])# + '&' + str(cen[ii])\n",
    "            try:\n",
    "                line_std[cur_method] = '&' + \"\" + '&(' + str(acc_std[ii]) + ')&(' + str(nmi_std[ii]) + \")\"# + '&' + str(cen[ii])\n",
    "            except:\n",
    "                continue\n",
    "        else:\n",
    "            line[cur_method] = line[cur_method] + '&&' + str(prompts[ii]) + '&' + str(acc[ii]) + '&' + str(nmi[ii])# + '&' + str(cen[ii])\n",
    "            try:\n",
    "                line_std[cur_method] = line_std[cur_method] + '&&' + \"\" + '&(' + str(acc_std[ii]) + ')&(' + str(nmi_std[ii]) + \")\"# + '&' + str(cen[ii])\n",
    "            except:\n",
    "                continue\n",
    "appendix = True\n",
    "\n",
    "text = \"k-LLMmeans &&&&&&&&&&&&\\\\\\\\\\n\"\n",
    "for ii in range(len(method_names)):\n",
    "    cur_method = method_names[ii]\n",
    "    \n",
    "    text = text + line[cur_method] + '\\\\\\\\\\n'\n",
    "    if (appendix == True):\n",
    "        try:\n",
    "            text = text + line_std[cur_method] + '\\\\\\\\\\n'\n",
    "        except:\n",
    "            continue\n",
    "    if \"Claude\" in cur_method:\n",
    "        text = text + '\\\\hline\\n'\n",
    "print(text) "
   ]
  },
  {
   "cell_type": "markdown",
   "id": "8e67396c-1166-4194-b378-073818d2a9e8",
   "metadata": {},
   "source": [
    "# Table including all klllmmeans kmeans, kmedoids and e5-large"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 74,
   "id": "9ac1e65f-4eda-4eb7-b0eb-2c984527457e",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[1.82]\n",
      "[1.82, 0.0]\n",
      "[1.82, 0.0, 0.0]\n",
      "[1.82, 0.0, 0.0, 0.0]\n",
      "[1.82, 0.0, 0.0, 0.0, 0.0]\n",
      "[1.83]\n",
      "[1.83, 0.0]\n",
      "[1.83, 0.0, 0.0]\n",
      "[1.83, 0.0, 0.0, 0.0]\n",
      "[1.83, 0.0, 0.0, 0.0, 0.0]\n",
      "[1.0]\n",
      "[1.0, 0.0]\n",
      "[1.0, 0.0, 0.0]\n",
      "[1.0, 0.0, 0.0, 0.0]\n",
      "[1.0, 0.0, 0.0, 0.0, 0.0]\n",
      "[4.03]\n",
      "[4.03, 0.0]\n",
      "[4.03, 0.0, 0.0]\n",
      "[4.03, 0.0, 0.0, 0.0]\n",
      "[4.03, 0.0, 0.0, 0.0, 0.0]\n",
      "[1.07]\n",
      "[1.07, 0.0]\n",
      "[1.07, 0.0, 0.0]\n",
      "[1.07, 0.0, 0.0, 0.0]\n",
      "[1.07, 0.0, 0.0, 0.0, 0.0]\n",
      "\\hline\n",
      "\\quad \\emph{textrank-single}&66.4&83.6&&78.7&92.4&&21.5&20.9&&60.6&68.9&&53.0&72.5\\\\\n",
      "&(0.94)&(0.47)&&(1.56)&(0.41)&&(0.63)&(0.29)&&(3.47)&(1.27)&&(1.8)&(0.71)\\\\\n",
      "\\quad \\emph{textrank-multiple}&66.8&83.9&&79.6&92.8&&21.6&21.0&&60.5&69.3&&53.7&72.8\\\\\n",
      "&(0.94)&(0.45)&&(1.51)&(0.45)&&(1.29)&(0.65)&&(3.66)&(1.22)&&(1.65)&(0.58)\\\\\n",
      "\\quad \\emph{centroid-single}&67.2&84.0&&78.5&92.2&&22.1&21.2&&60.9&68.3&&53.5&73.0\\\\\n",
      "&(0.81)&(0.39)&&(1.68)&(0.37)&&(0.6)&(0.41)&&(3.02)&(0.91)&&(2.07)&(1.13)\\\\\n",
      "\\quad \\emph{centroid-multiple}&67.5&84.0&&79.0&92.4&&21.4&21.1&&60.8&69.1&&54.3&73.5\\\\\n",
      "&(0.57)&(0.3)&&(1.95)&(0.46)&&(0.87)&(0.12)&&(2.72)&(1.09)&&(1.72)&(0.84)\\\\\n",
      "\\quad \\emph{lsa-single}&66.7&83.7&&78.8&92.5&&21.9&20.5&&61.2&68.7&&54.1&73.0\\\\\n",
      "&(0.99)&(0.47)&&(2.07)&(0.63)&&(1.11)&(0.87)&&(2.66)&(1.03)&&(1.86)&(0.91)\\\\\n",
      "\\quad \\emph{lsa-multiple}&67.1&84.0&&80.2&92.9&&22.3&20.2&&{\\bf 63.3}&70.0&&55.3&73.4\\\\\n",
      "&(0.98)&(0.42)&&(0.98)&(0.41)&&(0.85)&(0.56)&&(3.06)&(1.02)&&(1.32)&(0.72)\\\\\n",
      "\\quad \\emph{single}&67.1&83.6&&78.1&92.5&&24.0&{\\bf 22.3}&&61.1&69.6&&54.0&73.0\\\\\n",
      "&(1.22)&(0.46)&&(1.67)&(0.47)&&(1.35)&(0.57)&&(3.39)&(1.6)&&(1.51)&(0.58)\\\\\n",
      "\\quad \\emph{multiple}&66.7&83.6&&79.1&92.8&&24.1&22.1&&60.6&69.5&&55.8&73.5\\\\\n",
      "&(0.78)&(0.2)&&(1.68)&(0.48)&&(1.33)&(0.65)&&(2.82)&(1.66)&&(1.4)&(0.76)\\\\\n",
      "\\quad \\emph{FS-single}&67.5&83.8&&79.2&92.8&&23.0&21.9&&60.8&69.4&&55.3&73.6\\\\\n",
      "&(1.07)&(0.36)&&(1.73)&(0.43)&&(0.94)&(0.64)&&(3.21)&(1.09)&&(1.76)&(0.77)\\\\\n",
      "\\quad \\emph{FS-multiple}&67.9&{\\bf 84.1}&&80.2&{\\bf 93.1}&&{\\bf 24.2}&{\\bf 22.3}&&63.2&{\\bf 70.6}&&56.4&{\\bf 73.9}\\\\\n",
      "&(1.55)&(0.41)&&(1.52)&(0.32)&&(1.16)&(0.67)&&(2.84)&(1.38)&&(1.32)&(0.7)\\\\\n",
      "\\hline\n",
      "k-means&66.2&83.0&&77.3&92.0&&20.7&20.5&&59.4&67.9&&52.9&72.4\\\\\n",
      "&(1.82)&(0.56)&&(1.83)&(0.35)&&(1.0)&(0.67)&&(4.03)&(1.67)&&(1.07)&(0.54)\\\\\n",
      "k-medoids&41.7&69.5&&49.3&77.7&&15.7&15.9&&37.6&38.8&&35.9&52.4\\\\\n",
      "&(0.0)&(0.0)&&(0.0)&(0.0)&&(0.0)&(0.0)&&(0.0)&(0.0)&&(0.0)&(0.0)\\\\\n",
      "GMM&67.7&83.0&&78.9&92.7&&21.5&20.6&&56.2&68.6&&53.9&73.2\\\\\n",
      "&(0.0)&(0.0)&&(0.0)&(0.0)&&(0.0)&(0.0)&&(0.0)&(0.0)&&(0.0)&(0.0)\\\\\n",
      "Agglomerative&{\\bf 69.9}&83.7&&{\\bf 81.0}&92.5&&15.8&14.1&&62.8&67.1&&56.6&70.5\\\\\n",
      "&(0.0)&(0.0)&&(0.0)&(0.0)&&(0.0)&(0.0)&&(0.0)&(0.0)&&(0.0)&(0.0)\\\\\n",
      "Spectral&68.2&83.3&&76.3&90.9&&17.6&15.2&&61.5&67.0&&{\\bf 56.7}&71.4\\\\\n",
      "&(0.0)&(0.0)&&(0.0)&(0.0)&&(0.0)&(0.0)&&(0.0)&(0.0)&&(0.0)&(0.0)\\\\\n",
      "\n"
     ]
    }
   ],
   "source": [
    "line = {}\n",
    "line_std = {}\n",
    "emb_type = 'openai'\n",
    "line[emb_type] = {}\n",
    "line_std[emb_type] = {}\n",
    "\n",
    "for data in ['bank77','clinic', 'goemo', 'massive_D','massive_I']:\n",
    "\n",
    "    acc_nlp = []\n",
    "    nmi_nlp = []\n",
    "    cen_nlp = []\n",
    "\n",
    "    acc_nlp_std = []\n",
    "    nmi_nlp_std = []\n",
    "    cen_nlp_std = []\n",
    "    \n",
    "    method_names = []\n",
    "    for nlp_type in ['textrank','centroid','lsa']:\n",
    "        cur_results = results_summary[data][nlp_type][emb_type]['5-1']\n",
    "        acc_nlp.append(cur_results[0])\n",
    "        nmi_nlp.append(cur_results[1])\n",
    "        cen_nlp.append(cur_results[2])\n",
    "        cur_method = '\\\\quad \\\\emph{' + nlp_type + \"-single}\"\n",
    "\n",
    "        cur_results_std = results_summary_std[data][nlp_type][emb_type]['5-1']\n",
    "        acc_nlp_std.append(cur_results_std[0])\n",
    "        nmi_nlp_std.append(cur_results_std[1])\n",
    "        cen_nlp_std.append(cur_results_std[2])\n",
    "        \n",
    "        method_names.append(cur_method)\n",
    "\n",
    "        cur_results = results_summary[data][nlp_type][emb_type]['5-5']\n",
    "        acc_nlp.append(cur_results[0])\n",
    "        nmi_nlp.append(cur_results[1])\n",
    "        cen_nlp.append(cur_results[2])\n",
    "        cur_method = '\\\\quad \\\\emph{' + nlp_type + \"-multiple}\"\n",
    "\n",
    "        cur_results_std = results_summary_std[data][nlp_type][emb_type]['5-5']\n",
    "        acc_nlp_std.append(cur_results_std[0])\n",
    "        nmi_nlp_std.append(cur_results_std[1])\n",
    "        cen_nlp_std.append(cur_results_std[2])\n",
    "        \n",
    "        method_names.append(cur_method)\n",
    "        \n",
    "    acc = []\n",
    "    nmi = []\n",
    "    cen = []\n",
    "\n",
    "    acc_std = []\n",
    "    nmi_std = []\n",
    "    cen_std = []\n",
    "\n",
    "    for method in ['0-1','0-5','10-1','10-5']:\n",
    "        cur_results = results_summary[data]['gpt-4o'][emb_type][method]\n",
    "        acc.append(cur_results[0])\n",
    "        nmi.append(cur_results[1])\n",
    "        cen.append(cur_results[2])\n",
    "\n",
    "        cur_results_std = results_summary_std[data]['gpt-4o'][emb_type][method]\n",
    "        acc_std.append(cur_results_std[0])\n",
    "        nmi_std.append(cur_results_std[1])\n",
    "        cen_std.append(cur_results_std[2])\n",
    "        \n",
    "        if method == '10-1':\n",
    "            cur_method = '\\\\quad \\\\emph{FS-single}'\n",
    "        elif method == '10-5':\n",
    "            cur_method = '\\\\quad \\\\emph{FS-multiple}'\n",
    "        elif method == '0-1':\n",
    "            cur_method = '\\\\quad \\\\emph{single}'\n",
    "        elif method == '0-5':\n",
    "            cur_method = '\\\\quad \\\\emph{multiple}'\n",
    "        elif method == 'kmeans':\n",
    "            cur_method = 'k-means'\n",
    "        elif method == 'kmedoids':\n",
    "            cur_method = 'k-medoids'\n",
    "        method_names.append(cur_method)\n",
    "\n",
    "    # Find the maximum value\n",
    "    #val = max(acc)\n",
    "    #acc = [f\"{{\\\\bf {x}}}\" if x == val else x for x in acc]\n",
    "\n",
    "    #val = max(nmi)\n",
    "    #nmi = [f\"{{\\\\bf {x}}}\" if x == val else x for x in nmi]\n",
    "\n",
    "    #val = min(cen)\n",
    "    #cen = [f\"{{\\\\bf {x}}}\" if x == val else x for x in cen]\n",
    "    \n",
    "\n",
    "    acc_other = []\n",
    "    nmi_other = []\n",
    "    cen_other = []\n",
    "\n",
    "    acc_other_std = []\n",
    "    nmi_other_std = []\n",
    "    cen_other_std = []\n",
    "    \n",
    "    for other_method in ['kmeans','kmedoids','GMM','Agglomerative','Spectral']:\n",
    "        if 'km' in other_method:\n",
    "            cur_results = results_summary[data]['gpt-4o'][emb_type][other_method]\n",
    "            cur_results_std = results_summary_std[data]['gpt-4o'][emb_type][other_method]\n",
    "        else:\n",
    "            cur_results = results_summary[data][other_method][emb_type]\n",
    "            cur_results_std = results_summary_std[data][other_method][emb_type]\n",
    "        \n",
    "        acc_other.append(cur_results[0])\n",
    "        nmi_other.append(cur_results[1])\n",
    "        cen_other.append(cur_results[2])\n",
    "\n",
    "        acc_other_std.append(cur_results_std[0])\n",
    "        nmi_other_std.append(cur_results_std[1])\n",
    "        cen_other_std.append(cur_results_std[2])\n",
    "        print(acc_other_std)\n",
    "\n",
    "        if other_method == 'kmeans':\n",
    "            other_method = 'k-means'\n",
    "        elif other_method == 'kmedoids':\n",
    "            other_method = 'k-medoids'\n",
    "        method_names.append(other_method)\n",
    "\n",
    "    acc = acc_nlp + acc + acc_other\n",
    "    nmi = nmi_nlp + nmi + nmi_other\n",
    "    cen = cen_nlp + cen + cen_other\n",
    "\n",
    "    acc_std = acc_nlp_std + acc_std + acc_other_std\n",
    "    nmi_std = nmi_nlp_std + nmi_std + nmi_other_std\n",
    "    cen_std = cen_nlp_std + cen_std + cen_other_std\n",
    "\n",
    "    # Find the maximum value\n",
    "    val = max(acc)\n",
    "    acc = [f\"{{\\\\bf {x}}}\" if x == val else x for x in acc]\n",
    "\n",
    "    val = max(nmi)\n",
    "    nmi = [f\"{{\\\\bf {x}}}\" if x == val else x for x in nmi]\n",
    "\n",
    "    val = min(cen)\n",
    "    cen = [f\"{{\\\\bf {x}}}\" if x == val else x for x in cen]\n",
    "    \n",
    "    for ii in range(len(method_names)):\n",
    "        cur_method = method_names[ii]\n",
    "        if data == 'bank77':\n",
    "            line[emb_type][cur_method] = cur_method + '&' + str(acc[ii]) + '&' + str(nmi[ii])#+ '&' + str(cen[ii])# + '&' + str(cen[ii])\n",
    "            line_std[emb_type][cur_method] = '&(' + str(acc_std[ii]) + ')&(' + str(nmi_std[ii]) + \")\" #+ '&' + str(cen[ii])# + '&' + str(cen[ii])\n",
    "        else:\n",
    "            line[emb_type][cur_method] = line[emb_type][cur_method] + '&&' + str(acc[ii]) + '&' + str(nmi[ii])#+ '&' + str(cen[ii])# + '&' + str(cen[ii])\n",
    "            line_std[emb_type][cur_method] = line_std[emb_type][cur_method] + '&&(' + str(acc_std[ii]) + ')&(' + str(nmi_std[ii]) + \")\"#+ '&' + str(cen[ii])# + '&' + str(cen[ii])\n",
    "\n",
    "text = \"\"\n",
    "appendix = True\n",
    "\n",
    "for emb_type in ['openai']:\n",
    "    text = text + '\\\\hline\\n'\n",
    "    for ii in range(len(method_names)):\n",
    "        cur_method = method_names[ii]\n",
    "        if 'k-means' in cur_method:\n",
    "            text = text + '\\\\hline\\n'\n",
    "        text = text + line[emb_type][cur_method] + '\\\\\\\\\\n'\n",
    "        if appendix == True:\n",
    "            text = text + line_std[emb_type][cur_method] + '\\\\\\\\\\n'\n",
    "print(text) "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 58,
   "id": "6185a1b6-df13-4531-bff2-bf3268841d44",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\quad \\emph{FS-single}\n"
     ]
    }
   ],
   "source": [
    "cur_method = '\\\\quad \\\\emph{FS-single}'\n",
    "print(cur_method)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "3bbd5672-179e-4db3-8763-364372fee414",
   "metadata": {},
   "source": [
    "# Table including all embeddings, kmeans and kllmeans for gpt-4o"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 92,
   "id": "f55b0cf5-1947-487d-8483-eb378e56fed2",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\hline\n",
      "\\emph{distilbert}&&&&&&&&&&&&\\\\\n",
      "\\quad kmeans&53.9&77.2&{\\bf 0.34}&&17.8&18.3&0.364&&44.4&45.1&0.309\\\\\n",
      "&(0.96)&(0.49)&(0.007)&&(0.86)&(0.67)&(0.005)&&(1.53)&(0.99)&(0.021)\\\\\n",
      "\\quad k-NLPmeans&52.9&77.3&0.353&&{\\bf 18.5}&18.2&0.365&&44.7&45.3&0.311\\\\\n",
      "&(0.25)&(0.22)&(0.003)&&(0.58)&(0.38)&(0.004)&&(2.44)&(1.22)&(0.02)\\\\\n",
      "\\quad k-LLMmeans&{\\bf 55.3}&{\\bf 78.7}&0.343&&18.2&{\\bf 18.8}&{\\bf 0.351}&&{\\bf 46.2}&{\\bf 46.4}&{\\bf 0.295}\\\\\n",
      "&(1.1)&(0.53)&(0.009)&&(0.52)&(0.73)&(0.004)&&(1.35)&(1.12)&(0.015)\\\\\n",
      "\\hline\n",
      "\\emph{text-embedding-3-small}&&&&&&&&&&&&\\\\\n",
      "\\quad kmeans&77.3&92.0&0.2&&20.7&20.5&0.287&&59.4&67.9&0.246\\\\\n",
      "&(1.83)&(0.35)&(0.014)&&(1.0)&(0.67)&(0.005)&&(4.03)&(1.67)&(0.015)\\\\\n",
      "\\quad k-NLPmeans&{\\bf 80.2}&92.9&{\\bf 0.173}&&22.3&20.2&0.29&&{\\bf 63.3}&70.0&{\\bf 0.227}\\\\\n",
      "&(0.98)&(0.41)&(0.006)&&(0.85)&(0.56)&(0.007)&&(3.06)&(1.02)&(0.018)\\\\\n",
      "\\quad k-LLMmeans&{\\bf 80.2}&{\\bf 93.1}&0.179&&{\\bf 24.2}&{\\bf 22.3}&{\\bf 0.278}&&63.2&{\\bf 70.6}&{\\bf 0.227}\\\\\n",
      "&(1.52)&(0.32)&(0.015)&&(1.16)&(0.67)&(0.011)&&(2.84)&(1.38)&(0.022)\\\\\n",
      "\\hline\n",
      "\\emph{e5-large}&&&&&&&&&&&&\\\\\n",
      "\\quad kmeans&73.8&90.8&0.131&&22.8&22.8&0.176&&58.4&63.7&0.138\\\\\n",
      "&(2.34)&(0.74)&(0.01)&&(0.92)&(0.73)&(0.003)&&(3.89)&(1.75)&(0.02)\\\\\n",
      "\\quad k-NLPmeans&76.5&92.0&{\\bf 0.119}&&22.6&22.6&0.179&&60.4&65.7&0.137\\\\\n",
      "&(1.76)&(0.58)&(0.009)&&(0.7)&(0.32)&(0.003)&&(3.2)&(1.79)&(0.008)\\\\\n",
      "\\quad k-LLMmeans&{\\bf 77.2}&{\\bf 92.5}&{\\bf 0.119}&&{\\bf 24.2}&{\\bf 24.3}&{\\bf 0.168}&&{\\bf 62.3}&{\\bf 65.9}&{\\bf 0.133}\\\\\n",
      "&(1.6)&(0.4)&(0.007)&&(0.76)&(0.7)&(0.003)&&(1.36)&(0.78)&(0.007)\\\\\n",
      "\\hline\n",
      "\\emph{sbert}&&&&&&&&&&&&\\\\\n",
      "\\quad kmeans&76.9&91.0&0.215&&13.7&13.3&0.355&&58.2&64.6&0.271\\\\\n",
      "&(1.63)&(0.5)&(0.013)&&(0.62)&(0.57)&(0.005)&&(2.03)&(1.09)&(0.023)\\\\\n",
      "\\quad k-NLPmeans&79.0&91.9&0.201&&14.1&12.8&0.363&&58.5&64.6&0.272\\\\\n",
      "&(1.65)&(0.31)&(0.017)&&(0.3)&(0.29)&(0.003)&&(2.24)&(1.29)&(0.022)\\\\\n",
      "\\quad k-LLMmeans&{\\bf 79.7}&{\\bf 92.5}&{\\bf 0.198}&&{\\bf 14.7}&{\\bf 13.9}&{\\bf 0.346}&&{\\bf 59.7}&{\\bf 65.6}&{\\bf 0.254}\\\\\n",
      "&(0.73)&(0.25)&(0.008)&&(0.55)&(0.5)&(0.004)&&(2.54)&(0.79)&(0.019)\\\\\n",
      "\n"
     ]
    }
   ],
   "source": [
    "line = {}\n",
    "line_std = {}\n",
    "llm_type = 'gpt-4o'\n",
    "nlp_type = 'lsa'\n",
    "for emb_type in ['distilbert', 'openai','e5-large', 'sbert']:\n",
    "    line[emb_type] = {}\n",
    "    line_std[emb_type] = {}\n",
    "    \n",
    "for data in ['clinic', 'goemo' , 'massive_D']:\n",
    "\n",
    "    for emb_type in ['distilbert', 'openai','e5-large', 'sbert']:\n",
    "\n",
    "        acc = []\n",
    "        nmi = []\n",
    "        cen = []\n",
    "\n",
    "        acc_std = []\n",
    "        nmi_std = []\n",
    "        cen_std = []\n",
    "        method_names = []\n",
    "        for method in ['kmeans','k-NLPmeans','10-5']:\n",
    "\n",
    "            if method == 'k-NLPmeans':\n",
    "                cur_results = results_summary[data][nlp_type][emb_type]['5-5']\n",
    "                cur_results_std = results_summary_std[data][nlp_type][emb_type]['5-5']\n",
    "            else:\n",
    "                cur_results = results_summary[data][llm_type][emb_type][method]\n",
    "                cur_results_std = results_summary_std[data][llm_type][emb_type][method]\n",
    "            acc.append(cur_results[0])\n",
    "            nmi.append(cur_results[1])\n",
    "            cen.append(cur_results[2])\n",
    "\n",
    "            acc_std.append(cur_results_std[0])\n",
    "            nmi_std.append(cur_results_std[1])\n",
    "            cen_std.append(cur_results_std[2])\n",
    "            if method == '10-5':\n",
    "                cur_method = '\\\\quad k-LLMmeans'\n",
    "            else:\n",
    "                cur_method = '\\\\quad ' + method\n",
    "            method_names.append(cur_method)\n",
    "\n",
    "        # Find the maximum value\n",
    "        val = max(acc)\n",
    "        acc = [f\"{{\\\\bf {x}}}\" if x == val else x for x in acc]\n",
    "\n",
    "        val = max(nmi)\n",
    "        nmi = [f\"{{\\\\bf {x}}}\" if x == val else x for x in nmi]\n",
    "\n",
    "        val = min(cen)\n",
    "        cen = [f\"{{\\\\bf {x}}}\" if x == val else x for x in cen]\n",
    "        \n",
    "        for ii in range(len(method_names)):\n",
    "            cur_method = method_names[ii]\n",
    "            if data == 'clinic':\n",
    "                line[emb_type][cur_method] = cur_method + '&' + str(acc[ii]) + '&' + str(nmi[ii]) + '&' + str(cen[ii])# + '&' + str(cen[ii])\n",
    "                line_std[emb_type][cur_method] = '&(' + str(acc_std[ii]) + ')&(' + str(nmi_std[ii]) + ')&(' + str(cen_std[ii]) + \")\"# + '&' + str(cen[ii])\n",
    "            else:\n",
    "                line[emb_type][cur_method] = line[emb_type][cur_method] + '&&' + str(acc[ii]) + '&' + str(nmi[ii]) + '&' + str(cen[ii])# + '&' + str(cen[ii])\n",
    "                line_std[emb_type][cur_method] = line_std[emb_type][cur_method] + '&&(' + str(acc_std[ii]) + ')&(' + str(nmi_std[ii]) + ')&(' + str(cen_std[ii]) + \")\"# + '&' + str(cen[ii])\n",
    "\n",
    "text = \"\"\n",
    "appendix = True\n",
    "\n",
    "for emb_type in ['distilbert', 'openai','e5-large', 'sbert']:\n",
    "    if emb_type == 'openai':\n",
    "        cur_emb_type = 'text-embedding-3-small'\n",
    "    else:\n",
    "        cur_emb_type = emb_type\n",
    "    text = text + '\\\\hline\\n'\n",
    "    text = text + '\\\\emph{' + cur_emb_type + '}&&&&&&&&&&&&\\\\\\\\\\n'\n",
    "    for ii in range(len(method_names)):\n",
    "        cur_method = method_names[ii]\n",
    "        text = text + line[emb_type][cur_method] + '\\\\\\\\\\n'\n",
    "        if appendix == True:\n",
    "            text = text + line_std[emb_type][cur_method] + '\\\\\\\\\\n'\n",
    "print(text) "
   ]
  },
  {
   "cell_type": "markdown",
   "id": "25fd375f-2487-4350-ae2e-ee0015434704",
   "metadata": {},
   "source": [
    "# Table including all embeddings, kmeans and all k-llmmeans"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "473fc8c3-ff4d-443e-84cf-ffc43ab5019a",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\hline\n",
      "\\multirow{6}{*}{\\rotatebox{90}{distilbert}}&k-means&64.4&{\\bf 0.335}&&77.2&{\\bf 0.34}&&18.3&0.364&&58.1&0.366&&45.1&0.309\\\\\n",
      "&k-medoids&56.0&0.591&&66.8&0.69&&14.0&0.769&&42.6&0.847&&27.2&0.81\\\\\n",
      "&k-LLMmeans 1-iter&64.8&0.351&&77.4&0.352&&18.3&0.358&&58.6&{\\bf 0.362}&&46.0&{\\bf 0.294}\\\\\n",
      "&k-LLMmeans 5-iter&64.8&0.358&&77.7&0.356&&18.3&0.354&&{\\bf 59.0}&0.363&&45.6&0.306\\\\\n",
      "&k-LLMmeans FS 1-iter&64.8&0.352&&78.1&0.346&&{\\bf 18.9}&0.357&&58.8&0.365&&45.7&0.299\\\\\n",
      "&k-LLMmeans FS 5-iter&{\\bf 64.9}&0.363&&{\\bf 78.7}&0.343&&18.8&{\\bf 0.351}&&{\\bf 59.0}&{\\bf 0.362}&&{\\bf 46.4}&0.295\\\\\n",
      "\\hline\n",
      "\\multirow{6}{*}{\\rotatebox{90}{openai}}&k-means&83.0&0.225&&92.0&0.2&&20.5&0.287&&72.4&0.32&&67.9&0.246\\\\\n",
      "&k-medoids&69.5&0.639&&77.7&0.694&&15.9&0.852&&52.4&0.86&&38.8&0.797\\\\\n",
      "&k-LLMmeans 1-iter&83.6&0.221&&92.5&0.194&&{\\bf 22.3}&0.278&&73.0&0.314&&69.6&0.232\\\\\n",
      "&k-LLMmeans 5-iter&83.6&0.226&&92.8&0.186&&22.1&{\\bf 0.275}&&73.5&0.307&&69.5&0.238\\\\\n",
      "&k-LLMmeans FS 1-iter&83.8&{\\bf 0.219}&&92.8&0.186&&21.9&0.283&&73.6&0.314&&69.4&0.233\\\\\n",
      "&k-LLMmeans FS 5-iter&{\\bf 84.1}&0.22&&{\\bf 93.1}&{\\bf 0.179}&&{\\bf 22.3}&0.278&&{\\bf 73.9}&{\\bf 0.302}&&{\\bf 70.6}&{\\bf 0.227}\\\\\n",
      "\\hline\n",
      "\\multirow{6}{*}{\\rotatebox{90}{e5-large}}&k-means&76.7&0.142&&90.8&0.131&&22.8&0.176&&70.9&0.175&&63.7&0.138\\\\\n",
      "&k-medoids&64.5&0.331&&73.4&0.371&&15.7&0.447&&50.3&0.437&&36.3&0.405\\\\\n",
      "&k-LLMmeans 1-iter&78.6&0.138&&91.6&0.127&&23.4&0.176&&72.0&0.17&&64.8&0.134\\\\\n",
      "&k-LLMmeans 5-iter&79.0&0.136&&92.0&0.127&&23.7&0.174&&72.1&{\\bf 0.166}&&{\\bf 66.0}&{\\bf 0.131}\\\\\n",
      "&k-LLMmeans FS 1-iter&78.8&0.136&&91.7&0.127&&23.7&0.174&&71.6&0.173&&64.9&0.136\\\\\n",
      "&k-LLMmeans FS 5-iter&{\\bf 79.5}&{\\bf 0.134}&&{\\bf 92.5}&{\\bf 0.119}&&{\\bf 24.3}&{\\bf 0.168}&&{\\bf 72.4}&{\\bf 0.166}&&65.9&0.133\\\\\n",
      "\\hline\n",
      "\\multirow{6}{*}{\\rotatebox{90}{sbert}}&k-means&80.9&0.255&&91.0&0.215&&13.3&0.355&&70.7&0.344&&64.6&0.271\\\\\n",
      "&k-medoids&69.0&0.64&&78.5&0.68&&12.0&0.899&&54.6&0.817&&44.6&0.8\\\\\n",
      "&k-LLMmeans 1-iter&81.7&0.253&&91.6&0.215&&13.6&0.351&&71.2&0.334&&65.6&0.248\\\\\n",
      "&k-LLMmeans 5-iter&81.8&0.253&&91.9&0.21&&13.7&0.348&&71.5&{\\bf 0.325}&&65.2&0.25\\\\\n",
      "&k-LLMmeans FS 1-iter&82.0&{\\bf 0.246}&&91.8&0.208&&{\\bf 13.9}&0.348&&71.4&0.333&&{\\bf 66.2}&{\\bf 0.243}\\\\\n",
      "&k-LLMmeans FS 5-iter&{\\bf 82.2}&0.247&&{\\bf 92.5}&{\\bf 0.198}&&{\\bf 13.9}&{\\bf 0.346}&&{\\bf 71.9}&0.337&&65.6&0.254\\\\\n",
      "\n"
     ]
    }
   ],
   "source": [
    "line = {}\n",
    "llmty\n",
    "for emb_type in ['distilbert', 'openai','e5-large', 'sbert']:\n",
    "    line[emb_type] = {}\n",
    "    \n",
    "for data in ['bank77', 'clinic', 'goemo' , 'massive_I', 'massive_D']:\n",
    "\n",
    "    for emb_type in ['distilbert', 'openai','e5-large', 'sbert']:\n",
    "\n",
    "        acc = []\n",
    "        nmi = []\n",
    "        cen = []\n",
    "        method_names = []\n",
    "        for method in ['kmeans','kmedoids','0-1','0-5','10-1','10-5']:\n",
    "            cur_results = results_summary[data][emb_type][method]\n",
    "            acc.append(cur_results[0])\n",
    "            nmi.append(cur_results[1])\n",
    "            cen.append(cur_results[2])\n",
    "            if method == '10-1':\n",
    "                cur_method = 'k-LLMmeans FS 1-iter'\n",
    "            elif method == '10-5':\n",
    "                cur_method = 'k-LLMmeans FS 5-iter'\n",
    "            elif method == '0-1':\n",
    "                cur_method = 'k-LLMmeans 1-iter'\n",
    "            elif method == '0-5':\n",
    "                cur_method = 'k-LLMmeans 5-iter'\n",
    "            elif method == 'kmeans':\n",
    "                cur_method = 'k-means'\n",
    "            elif method == 'kmedoids':\n",
    "                cur_method = 'k-medoids'\n",
    "            method_names.append(cur_method)\n",
    "\n",
    "        # Find the maximum value\n",
    "        val = max(acc)\n",
    "        acc = [f\"{{\\\\bf {x}}}\" if x == val else x for x in acc]\n",
    "\n",
    "        val = max(nmi)\n",
    "        nmi = [f\"{{\\\\bf {x}}}\" if x == val else x for x in nmi]\n",
    "\n",
    "        val = min(cen)\n",
    "        cen = [f\"{{\\\\bf {x}}}\" if x == val else x for x in cen]\n",
    "        \n",
    "        for ii in range(len(method_names)):\n",
    "            cur_method = method_names[ii]\n",
    "            if data == 'bank77':\n",
    "                if cur_method == 'k-means':\n",
    "                    line[emb_type][cur_method] = '\\\\multirow{6}{*}{\\\\rotatebox{90}{' + emb_type + '}}' + '&' + cur_method + '&' + str(nmi[ii]) + '&' + str(cen[ii])# + '&' + str(cen[ii])\n",
    "                else:\n",
    "                    line[emb_type][cur_method] = '&' + cur_method + '&' + str(nmi[ii]) + '&' + str(cen[ii])# + '&' + str(cen[ii])\n",
    "            else:\n",
    "                line[emb_type][cur_method] = line[emb_type][cur_method] + '&&' + str(nmi[ii]) + '&' + str(cen[ii])# + '&' + str(cen[ii])\n",
    "\n",
    "text = \"\"\n",
    "for emb_type in ['distilbert', 'openai','e5-large', 'sbert']:\n",
    "    text = text + '\\\\hline\\n'\n",
    "    for ii in range(len(method_names)):\n",
    "        cur_method = method_names[ii]\n",
    "        text = text + line[emb_type][cur_method] + '\\\\\\\\\\n'\n",
    "print(text)          "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 117,
   "id": "84a88d00-f260-480e-85e1-570bcd13b131",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['k-LLMmeans', 'k-LLMmeans']"
      ]
     },
     "execution_count": 117,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "method_names"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6baeb544-5fe8-4736-82c9-d59293616323",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python [conda env:base] *",
   "language": "python",
   "name": "conda-base-py"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
