{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import scipy.stats as stats\n",
    "from scipy.stats import wasserstein_distance\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import os\n",
    "import csv\n",
    "from collections import defaultdict\n",
    "from scipy.stats import ttest_1samp\n",
    "from statistics import mean"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_groups(bias_type):\n",
    "\n",
    "    if \"acquiescence\" in bias_type:\n",
    "        first_group = \"pos alpha\"\n",
    "        second_group = \"orig alpha\"\n",
    "        first_options=['a']\n",
    "        second_options = first_options\n",
    "    elif \"response_order\" in bias_type:\n",
    "        first_group = \"orig alpha\"\n",
    "        second_group = \"reversed alpha\"\n",
    "        first_options=['a']\n",
    "        second_options = first_options\n",
    "    elif \"odd_even\" in bias_type:\n",
    "        first_group = \"no middle alpha\"\n",
    "        second_group = \"middle alpha\"\n",
    "        first_options =['b','d']\n",
    "        second_options = first_options\n",
    "    elif \"opinion_float\" in bias_type:\n",
    "        first_group = \"orig alpha\"\n",
    "        second_group = \"float alpha\"\n",
    "        first_options=['c']\n",
    "        second_options = first_options\n",
    "    elif \"negative_wording\" in bias_type:\n",
    "        first_group = \"orig alpha\"\n",
    "        second_group = \"forbid alpha\"\n",
    "        first_options=['a']\n",
    "        \n",
    "        if 'key_typo' in bias_type or 'middle_random' in bias_type or 'letter_swap' in bias_type:\n",
    "            second_options = ['a']\n",
    "        else:\n",
    "            second_options=['b']\n",
    "    else:\n",
    "        raise ValueError(f\"Invalid bias type: {bias_type}\")\n",
    "        \n",
    "    assert len(first_options) == len(second_options)\n",
    "        \n",
    "    return first_group, second_group, first_options, second_options"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def run_stat_test(model, bias_type):\n",
    "    \n",
    "    root = 'results/'+model+'/csv'\n",
    "    \n",
    "    if 'key_typo' in bias_type or 'middle_random' in bias_type or 'letter_swap' in bias_type:\n",
    "        file = bias_type+'.csv' \n",
    "    elif model == 'llama2-7b' or model == 'llama2-13b' or model=='llama2-70b' or model =='gpt-3.5-turbo-instruct'\\\n",
    "    or 'ext_gen' in model or model == 'llama2-70b-chat':\n",
    "        file = bias_type+'.csv'\n",
    "    else:\n",
    "        file = bias_type+'-sample.csv'\n",
    "    \n",
    "    scores = {}\n",
    "    original = defaultdict(lambda:0)\n",
    "    \n",
    "    with open(os.path.join(root, file), newline='') as csvfile:\n",
    "        reader = csv.DictReader(csvfile)\n",
    "        first_group, second_group, first_options, second_options = get_groups(file)\n",
    "        for row in reader:\n",
    "            \n",
    "            if row[\"key\"] not in scores:\n",
    "                scores[row[\"key\"]] = 0\n",
    "\n",
    "            if row[\"group\"] == first_group and row[\"response\"] in first_options:\n",
    "                scores[row[\"key\"]] += 1\n",
    "                original[row[\"key\"]] += 1\n",
    "            if row[\"group\"] == second_group and row[\"response\"] in second_options:\n",
    "                scores[row[\"key\"]] += -1\n",
    "            \n",
    "    values = list(scores.values())\n",
    "    values = [value/50*100 for value in values]\n",
    "    \n",
    "    og_values = list(original.values())\n",
    "    og_values = [value/50*100 for value in og_values]\n",
    "    \n",
    "    p_value = ttest_1samp(values, 0)[1]\n",
    "    \n",
    "    return mean(og_values), mean(values), p_value\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def run_stat_test_orig(model, bias_type, keys):\n",
    "    \n",
    "    root = 'results/'+model+'/csv'\n",
    "    \n",
    "    if 'key_typo' in bias_type or 'middle_random' in bias_type or 'letter_swap' in bias_type:\n",
    "        file = bias_type+'.csv' \n",
    "    elif model == 'llama2-7b' or model == 'llama2-13b' or model=='llama2-70b' or model =='gpt-3.5-turbo-instruct'\\\n",
    "    or 'ext_gen' in model or model == 'llama2-70b-chat':\n",
    "        file = bias_type+'.csv'\n",
    "    else:\n",
    "        file = bias_type+'-sample.csv'\n",
    "    \n",
    "    scores = {}\n",
    "    original = defaultdict(lambda:0)\n",
    "    \n",
    "    with open(os.path.join(root, file), newline='') as csvfile:\n",
    "        reader = csv.DictReader(csvfile)\n",
    "        first_group, second_group, first_options, second_options = get_groups(file)\n",
    "        for row in reader:\n",
    "            \n",
    "            if row[\"key\"] in keys:\n",
    "            \n",
    "                if row[\"key\"] not in scores:\n",
    "                    scores[row[\"key\"]] = 0\n",
    "\n",
    "                if row[\"group\"] == first_group and row[\"response\"] in first_options:\n",
    "                    scores[row[\"key\"]] += 1\n",
    "                    original[row[\"key\"]] += 1\n",
    "                if row[\"group\"] == second_group and row[\"response\"] in second_options:\n",
    "                    scores[row[\"key\"]] += -1\n",
    "            \n",
    "    values = list(scores.values())\n",
    "    values = [value/50*100 for value in values]\n",
    "    \n",
    "    og_values = list(original.values())\n",
    "    og_values = [value/50*100 for value in og_values]\n",
    "    \n",
    "    p_value = ttest_1samp(values, 0)[1]\n",
    "    \n",
    "    return mean(og_values), mean(values), p_value\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_qs(model, bias_type):\n",
    "    \n",
    "    root = 'results/'+model+'/csv'\n",
    "    \n",
    "    if 'key_typo' in bias_type or 'middle_random' in bias_type or 'letter_swap' in bias_type:\n",
    "        file = bias_type+'.csv' \n",
    "    elif model == 'llama2-7b' or model == 'llama2-13b' or model=='llama2-70b' or model =='gpt-3.5-turbo-instruct'\\\n",
    "    or 'ext_gen' in model or model == 'llama2-70b-chat':\n",
    "        file = bias_type+'.csv'\n",
    "    else:\n",
    "        file = bias_type+'-sample.csv'\n",
    "    \n",
    "    scores = {}\n",
    "    original = defaultdict(lambda:0)\n",
    "    \n",
    "    with open(os.path.join(root, file), newline='') as csvfile:\n",
    "        reader = csv.DictReader(csvfile)\n",
    "        first_group, second_group, first_options, second_options = get_groups(file)\n",
    "        for row in reader:\n",
    "            \n",
    "            if row[\"key\"] not in scores:\n",
    "                scores[row[\"key\"]] = 0\n",
    "\n",
    "            if row[\"group\"] == first_group and row[\"response\"] in first_options:\n",
    "                scores[row[\"key\"]] += 1\n",
    "                original[row[\"key\"]] += 1\n",
    "            if row[\"group\"] == second_group and row[\"response\"] in second_options:\n",
    "                scores[row[\"key\"]] += -1\n",
    "            \n",
    "\n",
    "    \n",
    "    return scores.keys()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def color_perturbation(val):\n",
    "    if val < 0.05:\n",
    "        color = 'background-color: yellow' \n",
    "    else:\n",
    "        color = \"\"\n",
    "    return color"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "models = ['gpt-3.5-turbo', 'gpt-3.5-turbo-instruct', 'llama2-7b', 'llama2-13b', 'llama2-70b', 'llama2-70b-chat', 'llama2-70b-ift']\n",
    "bias_types = ['acquiescence','response_order', 'odd_even', 'opinion_float', 'negative_wording']\n",
    "subset_bias_types = ['acquiescence-50','response_order-50', 'odd_even-50', 'opinion_float-50', 'negative_wording']\n",
    "perturbations = ['-key_typo', '-middle_random', '-letter_swap']\n",
    "clean_bias_labels = ['Acquiescence', 'Allow/forbid', 'Response Order', 'Opinion Float', 'Odd/even']\n",
    "\n",
    "\n",
    "all_results = []\n",
    "\n",
    "for model in models:\n",
    "    print(model)\n",
    "\n",
    "    for i in range(len(bias_types)):\n",
    "    \n",
    "        bias_type = bias_types[i]\n",
    "        \n",
    "        print(bias_type)\n",
    "        \n",
    "        original, diff, p_value = run_stat_test(model, bias_type)\n",
    "        lst = [model, clean_bias_labels[i], diff, p_value]\n",
    "        \n",
    "        for perturbation in perturbations:\n",
    "            \n",
    "            if subset_bias_types[i] == 'opinion_float-50': \n",
    "                bias_type = 'odd_even-50'+perturbation\n",
    "            else:\n",
    "                bias_type = subset_bias_types[i]+perturbation\n",
    "                \n",
    "            original, diff, p_value = run_stat_test(model, bias_type)\n",
    "            lst.append(diff)\n",
    "            lst.append(p_value)\n",
    "        \n",
    "        all_results.append(lst)\n",
    "\n",
    "\n",
    "df = pd.DataFrame(all_results, columns = ['model', 'bias type', 'modified', 'bias p value',\\\n",
    "                                          'key typo', 'key typo p value',\\\n",
    "                                          'middle random', 'middle random p value',\\\n",
    "                                          'letter swap', 'letter swap p value'])\n",
    "df = df.round(4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(df.round(4).to_latex(index=False, float_format=\"{:.4f}\".format))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "temp_df = df.drop(['baseline'], axis=1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "df.map(lambda x: len(str(x)))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(df.to_latex(index=False, float_format=\"{:.4f}\".format))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import seaborn as sns\n",
    "import numpy as np\n",
    "np.bool = np.bool_\n",
    "\n",
    "#no subset\n",
    "\n",
    "models = ['llama2-7b', 'llama2-13b', 'llama2-70b', 'llama2-70b-ift', 'llama2-70b-chat', 'gpt-3.5-turbo', 'gpt-3.5-turbo-instruct']\n",
    "bias_types = ['acquiescence','negative_wording', 'response_order', 'opinion_float', 'odd_even']\n",
    "subset_bias_types = ['acquiescence-50','response_order-50', 'odd_even-50', 'opinion_float-50', 'negative_wording']\n",
    "perturbations = ['-key_typo', '-middle_random', '-letter_swap']\n",
    "exp_settings = ['modified', 'key typo', 'middle random', 'letter swap']\n",
    "clean_labels = ['bias', 'key typo', 'middle random', 'letter swap']\n",
    "clean_bias_labels = ['Acquiescence', 'Allow/forbid', 'Response Order', 'Opinion Float', 'Odd/even']\n",
    "clean_model_labels = ['Llama2-7b', 'Llama2-13b', 'Llama2-70b', 'Solar', 'Llama-70b-chat', '3.5 Turbo', '3.5 Turbo Instruct']\n",
    "\n",
    "# fig, axs = plt.subplots(2, len(models), figsize=(15,6), gridspec_kw={\"height_ratios\":[1, 0.025]})\n",
    "fig, axs = plt.subplots(1, len(models), figsize=(15,3))\n",
    "\n",
    "\n",
    "for i in range(len(models)):\n",
    "    \n",
    "    model = models[i]\n",
    "    \n",
    "    effect_data = np.zeros((len(bias_types),len(exp_settings)))\n",
    "    p_values = np.zeros((len(bias_types),len(exp_settings)))\n",
    "    \n",
    "    for k in range(len(exp_settings)):\n",
    "        for j in range(len(bias_types)):\n",
    "            \n",
    "            exp_setting = exp_settings[k]\n",
    "            \n",
    "            if exp_setting == 'modified':\n",
    "                p_val_col = 'bias p value'\n",
    "\n",
    "            elif exp_setting ==\"key typo\":\n",
    "                p_val_col = 'key typo p value'\n",
    "            \n",
    "            elif exp_setting == \"middle random\":\n",
    "                p_val_col = 'middle random p value'\n",
    "            \n",
    "            elif exp_setting == \"middle random\":\n",
    "                p_val_col = 'middle random p value'\n",
    "                                    \n",
    "            effect_size = df[(df['bias type'] == bias_types[j])\\\n",
    "                                            &(df['model']==model)][exp_setting]\n",
    "            p_value = df[(df['bias type'] == bias_types[j])\\\n",
    "                                            &(df['model']==model)][p_val_col]\n",
    "            \n",
    "            p_values[j][k] = p_value.item()\n",
    "            if p_value.item() < 0.05:\n",
    "                effect_data[j][k] = effect_size.item()/50 #\n",
    "            else:\n",
    "                effect_data[j][k] = np.nan\n",
    "\n",
    "    \n",
    "    if i == 0:\n",
    "        sns.heatmap(effect_data, ax=axs[i], cbar=False, cmap='RdBu', vmin=-1, vmax=1, linewidths=1, linecolor='gray')  \n",
    "        tickvalues1 = [num+0.5 for num in range(0,len(bias_types))]\n",
    "        axs[i].set_yticks(tickvalues1)\n",
    "        axs[i].set_yticklabels(clean_bias_labels, rotation=0)\n",
    "    elif i==len(models)-1:\n",
    "        temp = sns.heatmap(effect_data, yticklabels=False, ax=axs[i], cmap='RdBu', vmin=-1, vmax=1, linewidths=1, linecolor='gray') \n",
    "    else:\n",
    "        sns.heatmap(effect_data, yticklabels=False, cbar=False, ax=axs[i], cmap='RdBu', vmin=-1, vmax=1, linewidths=1, linecolor='gray')  \n",
    "\n",
    "    tickvalues = [num+0.5 for num in range(0,len(exp_settings))]\n",
    "    axs[i].set_xticks(tickvalues)\n",
    "    axs[i].set_xticklabels(clean_labels, rotation=90)\n",
    "    axs[i].set_title(clean_model_labels[i])\n",
    "        \n",
    "    zm = np.ma.masked_less(p_values, 0.05)\n",
    "            \n",
    "    x= np.arange(effect_data.shape[1]+1)\n",
    "    y= np.arange(effect_data.shape[0]+1)\n",
    "\n",
    "    axs[i].pcolor(x, y, zm, hatch='//', alpha=0.)\n",
    "\n",
    "#fig.colorbar(axs[0,i].get_children()[0], cax=axs[1,2:4], orientation=\"horizontal\")\n",
    "\n",
    "#plt.show()\n",
    "#pcm = axs[i].pcolormesh(np.random.random((20, 20)) * (col + 1),cmap=\"RdBu\")    \n",
    "#fig.colorbar(temp, ax=axs[i], shrink=0.6)   \n",
    "plt.savefig(\"perturbation.pdf\", format=\"pdf\", bbox_inches=\"tight\")\n",
    "\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
