{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {
    "slideshow": {
     "slide_type": "-"
    }
   },
   "source": [
    "## Rank-Centrality Simulations\n",
    "\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Importing necessary libraries. They are mosty mathematical libraries and plotting libraries used but I have also imported a few more handy ones here. "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "slideshow": {
     "slide_type": "slide"
    }
   },
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "import scipy.stats as stats\n",
    "import matplotlib.pyplot as plt\n",
    "import math\n",
    "import string\n",
    "import random\n",
    "from scipy.linalg import eig \n",
    "np.random.seed(20)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "class RC_True_Weights:\n",
    "    \n",
    "    def __init__(self, n, bd, adj):\n",
    "        \n",
    "        self.n = n\n",
    "        self.bd = bd\n",
    "        self.A = adj\n",
    "        \n",
    "    def getP(self):\n",
    "        \n",
    "        mxdeg = self.n - 1\n",
    "        P = self.A / mxdeg\n",
    "        Ps = np.sum(P, axis = 1)\n",
    "        for i in range(self.n):\n",
    "            P[i,i] = 1 - Ps[i]\n",
    "        self.P = P\n",
    "\n",
    "    def get_stationary(self, Tr):\n",
    "        evals, evecs = np.linalg.eig(Tr.T)\n",
    "        evec1 = evecs[:,np.isclose(evals, 1)]\n",
    "        evec1 = evec1[:,0]\n",
    "        stationary = evec1 / evec1.sum()\n",
    "        stationary = stationary.real\n",
    "        return stationary\n",
    "    \n",
    "    def get_predicted_ws(self):\n",
    "        \n",
    "        self.getP()\n",
    "        prws = self.get_stationary(self.P)\n",
    "        self.predicted_wts = prws\n",
    "        return prws"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "n = 10\n",
    "A = np.zeros((10,10))\n",
    "df = pd.read_csv('sushi.csv', header=None)\n",
    "prefs = df.to_numpy()\n",
    "sm = 0\n",
    "for i in range(len(prefs)):\n",
    "    mul = prefs[i,0]\n",
    "    for j in range(n):\n",
    "        for k in range(j+1,n):\n",
    "            A[prefs[i,k+1]-1, prefs[i,j+1]-1] += mul\n",
    "A = (A/5000)\n",
    "rc = RC_True_Weights(n, 0, A)\n",
    "wgts = rc.get_predicted_ws()\n",
    "print(\"The True Weights are:\")\n",
    "print(wgts)\n",
    "final_true_weights = wgts"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "debug = False\n",
    "\n",
    "class RC_Byz_flips:\n",
    "    \n",
    "    def __init__(self, n, good_file_name, byz_fr, stra, wgts):\n",
    "        \n",
    "        self.n = n\n",
    "        self.good_file_name = good_file_name\n",
    "        self.bf = byz_fr\n",
    "        self.stra = stra\n",
    "        self.weights = wgts\n",
    "        self.rnd_perm = 1 + np.random.permutation(self.n)\n",
    "        \n",
    "    def getA(self):\n",
    "        \n",
    "        A = np.zeros((self.n,self.n))\n",
    "        df = pd.read_csv(self.good_file_name, header=None)\n",
    "        prefs = df.to_numpy()\n",
    "        sm = 0\n",
    "        all_prefs = []\n",
    "        for i in range(len(prefs)):\n",
    "            mul = prefs[i,0]\n",
    "            sm += mul\n",
    "            for j in range(mul):\n",
    "                all_prefs.append(prefs[i,1:].tolist())\n",
    "        \n",
    "        bad_pref_count =(int)(sm * (self.bf / (1-self.bf)))\n",
    "        for i in range(bad_pref_count):\n",
    "            all_prefs.append(self.stra(self.rnd_perm))\n",
    "        \n",
    "        for x in all_prefs:\n",
    "            for j in range(self.n):\n",
    "                for k in range(j+1,self.n):\n",
    "                    A[x[k]-1, x[j]-1] += 1\n",
    "        \n",
    "        A /= len(all_prefs)\n",
    "        self.A = A\n",
    "        \n",
    "    def getP(self):\n",
    "        \n",
    "        self.getA()\n",
    "        mxdeg = self.n - 1\n",
    "        \n",
    "        P = self.A / mxdeg\n",
    "        Ps = np.sum(P, axis = 1)\n",
    "        for i in range(self.n):\n",
    "            P[i,i] = 1 - Ps[i]\n",
    "        self.P = P\n",
    "        \n",
    "    def get_stationary(self, Tr):\n",
    "        \n",
    "        evals, evecs = np.linalg.eig(Tr.T)\n",
    "        evec1 = evecs[:,np.isclose(evals, 1)]\n",
    "        evec1 = evec1[:,0]\n",
    "        stationary = evec1 / evec1.sum()\n",
    "        stationary = stationary.real\n",
    "        return stationary\n",
    "        \n",
    "\n",
    "    def norm(self, x):\n",
    "    \n",
    "        y = x*x\n",
    "        z = np.sum(y)\n",
    "        return z\n",
    "    \n",
    "    def get_error(self):\n",
    "        \n",
    "        df = self.predicted_wts - self.weights\n",
    "        return self.norm(df) / self.norm(self.weights)\n",
    "    \n",
    "    def get_predicted_ws(self):\n",
    "        \n",
    "        self.getP()\n",
    "        prws = self.get_stationary(self.P)\n",
    "        self.predicted_wts = prws\n",
    "        er = self.get_error()\n",
    "        kt, _ = stats.kendalltau(self.predicted_wts, self.weights)\n",
    "        return prws, er, kt"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def opposite_vote(pr):\n",
    "    return [9,6,8,3,4,1,5,10,2,7]\n",
    "    \n",
    "def opposite_random_flips(pr):\n",
    "    st = [9,6,8,3,4,1,5,10,2,7]\n",
    "    cflips = 2\n",
    "    for i in range(cflips):\n",
    "        fl1 = (int)(10*random.random())\n",
    "        fl2 = (int)(10*random.random())\n",
    "        t1 = st[fl1]\n",
    "        st[fl1] = st[fl2]\n",
    "        st[fl2] = t1\n",
    "    return st\n",
    "\n",
    "def fixed_order_vote(pr):\n",
    "    return pr"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "n = 10\n",
    "bf = [x/20 for x in range(10)]\n",
    "all_f = [fixed_order_vote,opposite_vote,opposite_random_flips]\n",
    "all_str = [\"fixed_order_vote\",\"opposite_vote\", \"opposite_random_flips\"]\n",
    "res = [[] for i in range(len(all_f))]\n",
    "res_kt = [[] for i in range(len(all_f))]\n",
    "num_iter = 10\n",
    "\n",
    "for i in range(len(all_f)):\n",
    "    for byz_fr in bf:\n",
    "        sme = 0\n",
    "        smkt = 0\n",
    "        for ite in range(num_iter):\n",
    "            rc = RC_Byz_flips(n, 'sushi.csv', byz_fr, all_f[i], final_true_weights)\n",
    "            _, err, kt = rc.get_predicted_ws()\n",
    "            sme += math.sqrt(err)\n",
    "            smkt += kt\n",
    "        sme /= num_iter\n",
    "        smkt /= num_iter\n",
    "        res[i].append(sme)\n",
    "        res_kt[i].append(smkt)\n",
    "        print(byz_fr, sme, smkt)\n",
    "    plt.plot(bf, res[i], label = all_str[i])\n",
    "    \n",
    "plt.xlabel(\"Byzantine Fraction\")\n",
    "plt.ylabel(\"L2 Error\")\n",
    "plt.legend()\n",
    "plt.show()\n",
    "\n",
    "for i in range(len(all_f)):\n",
    "    plt.plot(bf, res_kt[i], label = all_str[i])\n",
    "    \n",
    "plt.xlabel(\"Byzantine Fraction\")\n",
    "plt.ylabel(\"Kendall-Tau Correlation\")\n",
    "plt.legend()\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "for i in range(len(all_f)):\n",
    "    plt.plot(bf[:5], res[i][:5], label = all_str[i])\n",
    "    \n",
    "plt.xlabel(\"Byzantine Fraction\")\n",
    "plt.ylabel(r\"$L_2$ Score\")\n",
    "plt.legend()\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "with open('res_sushi_rc.npy', 'wb') as f:\n",
    "    np.save(f, res)\n",
    "\n",
    "with open('res_kt_sushi_rc.npy', 'wb') as f:\n",
    "    np.save(f, res_kt)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(res)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(res_kt)"
   ]
  }
 ],
 "metadata": {
  "celltoolbar": "Slideshow",
  "colab": {
   "name": "Untitled4.ipynb",
   "provenance": []
  },
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.4"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 1
}
