{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {
    "tags": []
   },
   "source": [
    "# Rank Aggregation for Mix Instruct"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "from rpy2.robjects.packages import importr\n",
    "from rpy2.robjects import numpy2ri\n",
    "import pickle5 as pickle"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "# Enable automatic numpy <-> R object conversion for the rpy2 calls below.\n",
    "numpy2ri.activate()\n",
    "# Load the R package RankAggreg; its functions are reached via `rankaggreg`.\n",
    "rankaggreg = importr(\"RankAggreg\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "def aggregate_ordered_lists(x,\n",
    "                            k,\n",
    "                            importance,\n",
    "                            method='CE',\n",
    "                            distance='Spearman',\n",
    "                            seed=0,\n",
    "                            verbose=False):\n",
    "    \"\"\"Aggregate several ordered lists into one consensus list.\n",
    "\n",
    "    Thin wrapper: converts `x` and `importance` to numpy arrays and forwards\n",
    "    every argument by keyword to the R function `RankAggreg` through rpy2.\n",
    "\n",
    "    Parameters\n",
    "    ----------\n",
    "    x : array-like\n",
    "        Ordered lists to aggregate. Callers in this notebook pass a 2-D\n",
    "        array (presumably one ranked list per row -- confirm against the\n",
    "        RankAggreg documentation).\n",
    "    k : int\n",
    "        Forwarded as `k`; callers here pass the number of columns of `x`.\n",
    "    importance : array-like\n",
    "        Forwarded as `importance`; callers here pass one weight per row of `x`.\n",
    "    method : str, default 'CE'\n",
    "        Forwarded as `method`.\n",
    "    distance : str, default 'Spearman'\n",
    "        Forwarded as `distance`.\n",
    "    seed : int, default 0\n",
    "        Forwarded as `seed`.\n",
    "    verbose : bool, default False\n",
    "        Forwarded as `verbose`.\n",
    "\n",
    "    Returns\n",
    "    -------\n",
    "    The object returned by `RankAggreg`, unchanged. The notebook reads the\n",
    "    aggregated list from its first component (`result[0]`).\n",
    "    \"\"\"\n",
    "    return rankaggreg.RankAggreg(\n",
    "        x=np.array(x),\n",
    "        k=k,\n",
    "        method=method,\n",
    "        distance=distance,\n",
    "        importance=np.array(importance),\n",
    "        seed=seed,\n",
    "        verbose=verbose,\n",
    "    )"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Mix Instruct Test All Metrics"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### First Order"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "# Load the first-order ranked lists. pickle.load can run arbitrary code,\n",
    "# so only point this at a trusted file.\n",
    "with open('ranked_lists_fo_mix_instruct_test.pickle', mode='rb') as pickle_file:\n",
    "    ranked_lists_fo = pickle.load(pickle_file)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "# Stack the first-order ranked lists into one array.\n",
    "x = np.array(ranked_lists_fo)\n",
    "k = x.shape[1]                # k = number of columns of x\n",
    "importance = np.ones(len(x))  # equal weight for every row of x\n",
    "results = aggregate_ordered_lists(x=x, k=k, importance=importance)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['oasst-sft-4-pythia-12b-epoch-3.5', 'alpaca-native', 'chatglm-6b', 'vicuna-13b-1.1', 'llama-7b-hf-baize-lora-bf16', 'koala-7B-HF', 'moss-moon-003-sft', 'flan-t5-xxl', 'mpt-7b-instruct', 'dolly-v2-12b', 'stablelm-tuned-alpha-7b', 'mpt-7b']\n",
      "----------------------------------------------------------------------------------------------------\n",
      "[('oasst-sft-4-pythia-12b-epoch-3.5', 1), ('alpaca-native', 2), ('chatglm-6b', 3), ('vicuna-13b-1.1', 4), ('llama-7b-hf-baize-lora-bf16', 5), ('koala-7B-HF', 6), ('moss-moon-003-sft', 7), ('flan-t5-xxl', 8), ('mpt-7b-instruct', 9), ('dolly-v2-12b', 10), ('stablelm-tuned-alpha-7b', 11), ('mpt-7b', 12)]\n"
     ]
    }
   ],
   "source": [
    "# The aggregated list is read from the first component of the result.\n",
    "optimal_list = list(results[0])\n",
    "print(optimal_list)\n",
    "print('-' * 100)\n",
    "# Pair each entry with its 1-based position in the aggregated list.\n",
    "print([(entry, rank) for rank, entry in enumerate(optimal_list, start=1)])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Second Order"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "# Load the second-order ranked lists. pickle.load can run arbitrary code,\n",
    "# so only point this at a trusted file.\n",
    "with open('ranked_lists_so_mix_instruct_test.pickle', mode='rb') as pickle_file:\n",
    "    ranked_lists_so = pickle.load(pickle_file)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "# Stack the second-order ranked lists into one array.\n",
    "x_so = np.array(ranked_lists_so)\n",
    "k = x_so.shape[1]                # k = number of columns of x_so\n",
    "importance = np.ones(len(x_so))  # equal weight for every row of x_so\n",
    "results_so = aggregate_ordered_lists(x=x_so, k=k, importance=importance)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['oasst-sft-4-pythia-12b-epoch-3.5', 'alpaca-native', 'chatglm-6b', 'vicuna-13b-1.1', 'llama-7b-hf-baize-lora-bf16', 'moss-moon-003-sft', 'koala-7B-HF', 'mpt-7b-instruct', 'dolly-v2-12b', 'stablelm-tuned-alpha-7b', 'mpt-7b', 'flan-t5-xxl']\n",
      "----------------------------------------------------------------------------------------------------\n",
      "[('oasst-sft-4-pythia-12b-epoch-3.5', 1), ('alpaca-native', 2), ('chatglm-6b', 3), ('vicuna-13b-1.1', 4), ('llama-7b-hf-baize-lora-bf16', 5), ('moss-moon-003-sft', 6), ('koala-7B-HF', 7), ('mpt-7b-instruct', 8), ('dolly-v2-12b', 9), ('stablelm-tuned-alpha-7b', 10), ('mpt-7b', 11), ('flan-t5-xxl', 12)]\n"
     ]
    }
   ],
   "source": [
    "# The aggregated list is read from the first component of the result.\n",
    "optimal_list_so = list(results_so[0])\n",
    "print(optimal_list_so)\n",
    "print('-' * 100)\n",
    "# Pair each entry with its 1-based position in the aggregated list.\n",
    "print([(entry, rank) for rank, entry in enumerate(optimal_list_so, start=1)])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Mean Risk Models"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "\n",
    "# Load the mean-risk-model ranked lists. pickle.load can run arbitrary code,\n",
    "# so only point this at a trusted file.\n",
    "with open('ranked_lists_mean_risk_model_portfolio_mix_instruct_test.pickle', mode='rb') as pickle_file:\n",
    "    ranked_lists_mrm = pickle.load(pickle_file)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "# Stack the mean-risk-model ranked lists into one array.\n",
    "x_mrm = np.array(ranked_lists_mrm)\n",
    "k = x_mrm.shape[1]                # k = number of columns of x_mrm\n",
    "importance = np.ones(len(x_mrm))  # equal weight for every row of x_mrm\n",
    "results_mrm = aggregate_ordered_lists(x=x_mrm, k=k, importance=importance)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['oasst-sft-4-pythia-12b-epoch-3.5', 'chatglm-6b', 'alpaca-native', 'vicuna-13b-1.1', 'llama-7b-hf-baize-lora-bf16', 'koala-7B-HF', 'dolly-v2-12b', 'moss-moon-003-sft', 'mpt-7b-instruct', 'mpt-7b', 'stablelm-tuned-alpha-7b', 'flan-t5-xxl']\n",
      "----------------------------------------------------------------------------------------------------\n",
      "[('oasst-sft-4-pythia-12b-epoch-3.5', 1), ('chatglm-6b', 2), ('alpaca-native', 3), ('vicuna-13b-1.1', 4), ('llama-7b-hf-baize-lora-bf16', 5), ('koala-7B-HF', 6), ('dolly-v2-12b', 7), ('moss-moon-003-sft', 8), ('mpt-7b-instruct', 9), ('mpt-7b', 10), ('stablelm-tuned-alpha-7b', 11), ('flan-t5-xxl', 12)]\n"
     ]
    }
   ],
   "source": [
    "# The aggregated list is read from the first component of the result.\n",
    "optimal_list_mrm = list(results_mrm[0])\n",
    "print(optimal_list_mrm)\n",
    "print('-' * 100)\n",
    "# Pair each entry with its 1-based position in the aggregated list.\n",
    "print([(entry, rank) for rank, entry in enumerate(optimal_list_mrm, start=1)])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "tags": []
   },
   "source": [
    "##### p = 0.05"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "\n",
    "# Load the ranked lists stored in the `_05` file (p = 0.05 section).\n",
    "# pickle.load can run arbitrary code, so only point this at a trusted file.\n",
    "with open('ranked_lists_mean_risk_model_portfolio_mix_instruct_test_05.pickle', mode='rb') as pickle_file:\n",
    "    ranked_lists_mrm_05 = pickle.load(pickle_file)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "# Stack the p = 0.05 mean-risk-model ranked lists into one array.\n",
    "x_mrm_05 = np.array(ranked_lists_mrm_05)\n",
    "k = x_mrm_05.shape[1]                # k = number of columns of x_mrm_05\n",
    "importance = np.ones(len(x_mrm_05))  # equal weight for every row of x_mrm_05\n",
    "results_mrm_05 = aggregate_ordered_lists(x=x_mrm_05, k=k, importance=importance)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['oasst-sft-4-pythia-12b-epoch-3.5', 'chatglm-6b', 'vicuna-13b-1.1', 'alpaca-native', 'llama-7b-hf-baize-lora-bf16', 'koala-7B-HF', 'dolly-v2-12b', 'moss-moon-003-sft', 'mpt-7b-instruct', 'mpt-7b', 'stablelm-tuned-alpha-7b', 'flan-t5-xxl']\n",
      "----------------------------------------------------------------------------------------------------\n",
      "[('oasst-sft-4-pythia-12b-epoch-3.5', 1), ('chatglm-6b', 2), ('vicuna-13b-1.1', 3), ('alpaca-native', 4), ('llama-7b-hf-baize-lora-bf16', 5), ('koala-7B-HF', 6), ('dolly-v2-12b', 7), ('moss-moon-003-sft', 8), ('mpt-7b-instruct', 9), ('mpt-7b', 10), ('stablelm-tuned-alpha-7b', 11), ('flan-t5-xxl', 12)]\n"
     ]
    }
   ],
   "source": [
    "# The aggregated list is read from the first component of the result.\n",
    "optimal_list_mrm_05 = list(results_mrm_05[0])\n",
    "print(optimal_list_mrm_05)\n",
    "print('-' * 100)\n",
    "# Pair each entry with its 1-based position in the aggregated list.\n",
    "print([(entry, rank) for rank, entry in enumerate(optimal_list_mrm_05, start=1)])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "tags": []
   },
   "source": [
    "#### Mean Risk Models All Metrics Gamma"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "\n",
    "# Load the all-metrics gamma ranked lists. pickle.load can run arbitrary\n",
    "# code, so only point this at a trusted file.\n",
    "with open('ranked_lists_mean_risk_model_all_metrics_gamma_test.pickle', mode='rb') as pickle_file:\n",
    "    ranked_lists_mrm_all_metrics = pickle.load(pickle_file)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "# Stack the all-metrics gamma ranked lists into one array.\n",
    "x_mrm_all_metrics = np.array(ranked_lists_mrm_all_metrics)\n",
    "k = x_mrm_all_metrics.shape[1]                # k = number of columns\n",
    "importance = np.ones(len(x_mrm_all_metrics))  # equal weight for every row\n",
    "results_mrm_all_metrics = aggregate_ordered_lists(x=x_mrm_all_metrics, k=k, importance=importance)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['oasst-sft-4-pythia-12b-epoch-3.5', 'alpaca-native', 'chatglm-6b', 'vicuna-13b-1.1', 'llama-7b-hf-baize-lora-bf16', 'moss-moon-003-sft', 'koala-7B-HF', 'mpt-7b-instruct', 'dolly-v2-12b', 'mpt-7b', 'stablelm-tuned-alpha-7b', 'flan-t5-xxl']\n",
      "----------------------------------------------------------------------------------------------------\n",
      "[('oasst-sft-4-pythia-12b-epoch-3.5', 1), ('alpaca-native', 2), ('chatglm-6b', 3), ('vicuna-13b-1.1', 4), ('llama-7b-hf-baize-lora-bf16', 5), ('moss-moon-003-sft', 6), ('koala-7B-HF', 7), ('mpt-7b-instruct', 8), ('dolly-v2-12b', 9), ('mpt-7b', 10), ('stablelm-tuned-alpha-7b', 11), ('flan-t5-xxl', 12)]\n"
     ]
    }
   ],
   "source": [
    "# The aggregated list is read from the first component of the result.\n",
    "optimal_list_mrm_all_metrics = list(results_mrm_all_metrics[0])\n",
    "print(optimal_list_mrm_all_metrics)\n",
    "print('-' * 100)\n",
    "# Pair each entry with its 1-based position in the aggregated list.\n",
    "print([(entry, rank) for rank, entry in enumerate(optimal_list_mrm_all_metrics, start=1)])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Mean Win Rate"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "# Load the mean-win-rate ranked lists. pickle.load can run arbitrary code,\n",
    "# so only point this at a trusted file.\n",
    "with open('MeanWinRate', mode='rb') as pickle_file:\n",
    "    ranked_lists_mwr = pickle.load(pickle_file)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "# The mean-win-rate lists are stored as a dict; stack its values into an array.\n",
    "x_mwr = np.array(list(ranked_lists_mwr.values()))\n",
    "# Derive k and the weights from x_mwr itself so this cell does not depend on\n",
    "# the first-order array `x` defined in an earlier cell.\n",
    "k = x_mwr.shape[1]\n",
    "importance = np.ones(x_mwr.shape[0])  # equal weight for every row of x_mwr\n",
    "results_mwr = aggregate_ordered_lists(x_mwr, k, importance=importance)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['oasst-sft-4-pythia-12b-epoch-3.5', 'alpaca-native', 'vicuna-13b-1.1', 'chatglm-6b', 'flan-t5-xxl', 'koala-7B-HF', 'stablelm-tuned-alpha-7b', 'llama-7b-hf-baize-lora-bf16', 'moss-moon-003-sft', 'dolly-v2-12b', 'mpt-7b-instruct', 'mpt-7b']\n",
      "----------------------------------------------------------------------------------------------------\n",
      "[('oasst-sft-4-pythia-12b-epoch-3.5', 1), ('alpaca-native', 2), ('vicuna-13b-1.1', 3), ('chatglm-6b', 4), ('flan-t5-xxl', 5), ('koala-7B-HF', 6), ('stablelm-tuned-alpha-7b', 7), ('llama-7b-hf-baize-lora-bf16', 8), ('moss-moon-003-sft', 9), ('dolly-v2-12b', 10), ('mpt-7b-instruct', 11), ('mpt-7b', 12)]\n"
     ]
    }
   ],
   "source": [
    "# The aggregated list is read from the first component of the result.\n",
    "optimal_list_mwr = list(results_mwr[0])\n",
    "print(optimal_list_mwr)\n",
    "print('-' * 100)\n",
    "# Pair each entry with its 1-based position in the aggregated list.\n",
    "print([(entry, rank) for rank, entry in enumerate(optimal_list_mwr, start=1)])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
