{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Plot histogram"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import torch\n",
    "import pandas as pd\n",
    "import numpy as np"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "absolute_path = \"/\".join(os.path.abspath(os.getcwd()).split('/')[:-2])\n",
    "absolute_path"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import sys\n",
    "sys.path.append(absolute_path)\n",
    "\n",
    "from utils.experiments import visualization, df_analysis"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "eval_path = 'logs/eval_models'\n",
    "path_to_save = os.path.join(absolute_path, 'experiments/dump_results')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sim_mx_logs = 'logs/similarity_matrix/efficient_pnka/topk_landmarks_from_trainset'\n",
    "arch1 = 'r18'\n",
    "arch2 = arch1\n",
    "layer = 'l17'\n",
    "dataset = 'cifar10'\n",
    "\n",
    "seeds_even = np.array([0,0,1])\n",
    "seeds_odd = np.array([1,2,2])\n",
    "seeds_even, seeds_odd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "input_data = f'{dataset}_testset'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "nb_landmarks = 1000"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sims = []\n",
    "cka_sims = []\n",
    "folder_names = []\n",
    "all_preds = []\n",
    "all_agree_preds = []\n",
    "all_correct_preds = []\n",
    "processed_model_names = []\n",
    "\n",
    "for idx, (seed1,seed2) in enumerate(zip(seeds_even, seeds_odd)):\n",
    "    print(seed1, seed2)\n",
    "    model_name1 = f'{dataset}-{arch1}-seed{seed1}'\n",
    "    model_name2 = f'{dataset}-{arch2}-seed{seed2}'\n",
    "    \n",
    "    sim_mx_folder = f'M1_{model_name1}_{layer}_M2_{model_name2}_{layer}'\n",
    "    folder_names.append(f'{seed1}_{seed2}')\n",
    "    sim_mx = torch.load(\n",
    "        os.path.join(\n",
    "            absolute_path, sim_mx_logs, sim_mx_folder, input_data, 'pnka.pt'))\n",
    "    cka_mx = torch.load(\n",
    "        os.path.join(\n",
    "            absolute_path, 'logs/similarity_matrix/cka/', sim_mx_folder, input_data,'final_sim_xxtyyt.pt'))\n",
    "    norm = torch.load(\n",
    "        os.path.join(\n",
    "            absolute_path, 'logs/similarity_matrix/cka/', sim_mx_folder, input_data,'norm.pt'))\n",
    "    cka_sims.append(torch.trace(cka_mx)/norm)\n",
    "#     sim = torch.diag(sim_mx)\n",
    "    sims.append(sim_mx)\n",
    "\n",
    "    preds1 = torch.load(\n",
    "        os.path.join(\n",
    "            absolute_path, eval_path, model_name1, 'preds.pt'))\n",
    "    labels1 = torch.load(\n",
    "        os.path.join(\n",
    "            absolute_path, eval_path, model_name1, 'labels.pt'))\n",
    "    if model_name1 not in processed_model_names:\n",
    "        processed_model_names.append(model_name1)\n",
    "        all_preds.append(preds1)\n",
    "        all_correct_preds.append(torch.eq(preds1, labels1).int())\n",
    "\n",
    "    preds2 = torch.load(\n",
    "        os.path.join(\n",
    "            absolute_path, eval_path, model_name2, 'preds.pt'))\n",
    "    labels2 = torch.load(\n",
    "        os.path.join(\n",
    "            absolute_path, eval_path, model_name2, 'labels.pt'))\n",
    "    if not torch.equal(labels1, labels2):\n",
    "        break\n",
    "    if model_name2 not in processed_model_names:\n",
    "        processed_model_names.append(model_name2)\n",
    "        all_preds.append(preds2)\n",
    "        all_correct_preds.append(torch.eq(preds2, labels1).int())\n",
    "\n",
    "    all_agree_preds.append(torch.eq(preds1, preds2).int())\n",
    "\n",
    "\n",
    "sims = torch.stack(sims)\n",
    "all_preds = torch.stack(all_preds)\n",
    "all_agree_preds = torch.stack(all_agree_preds)\n",
    "all_correct_preds = torch.stack(all_correct_preds)\n",
    "cka_sims = torch.stack(cka_sims)\n",
    "sims.shape, cka_sims.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "data = {}\n",
    "for folder_name, sim in zip(folder_names, sims):\n",
    "    data[folder_name] = sim\n",
    "df = pd.DataFrame(data)\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "avg = df.mean(axis=1)\n",
    "std = df.std(axis=1)\n",
    "df['avg'] = avg\n",
    "df['std'] = std"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "max(df['std']), min(df['std']), df['std'].mean()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def all_same(items):\n",
    "    return all(x == items[0] for x in items)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "correctness = []\n",
    "for idx, (correct) in enumerate(all_correct_preds.T):\n",
    "    if all_same(correct):\n",
    "        correctness.append(1)\n",
    "    else:\n",
    "        correctness.append(0)\n",
    "correctness = torch.tensor(correctness)\n",
    "correctness.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "agreeableness = []\n",
    "for idx, (preds) in enumerate(all_preds.T):\n",
    "#     print(preds, all_same(preds))\n",
    "    if all_same(preds):\n",
    "        agreeableness.append(1)\n",
    "    else:\n",
    "        agreeableness.append(0)\n",
    "agreeableness = torch.tensor(agreeableness)\n",
    "agreeableness.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "for idx, (seed1,seed2) in enumerate(zip(seeds_even, seeds_odd)):\n",
    "    df[f'agree_{seed1}_{seed2}'] = all_agree_preds[idx]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "df['all_agreeableness'] = agreeableness"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "df['all_correct'] = correctness"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "df['ratio_agree_preds'] = df[['agree_0_1','agree_0_2','agree_1_2']].mean(axis=1)\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "cka_score = torch.mean(cka_sims)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sim_agree = df[df['all_correct'] == 1]['avg']\n",
    "sim_disagree = df[df['all_correct'] != 1]['avg']\n",
    "sim_agree.shape, sim_disagree.shape"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Overall Histogram"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "filename = os.path.join(path_to_save, f'hist_bycorrectness_{dataset}-{arch1}-{layer}_avgoverdiffseeds_nbinsx10_top{nb_landmarks}balancedlandmarksfromtrain.pdf')\n",
    "filename"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "scrolled": false
   },
   "outputs": [],
   "source": [
    "visualization.plot_histogram(\n",
    "#     all_x=[df['avg']],\n",
    "    all_x=[sim_agree, sim_disagree],\n",
    "    all_names=['Same Prediction', 'Different Prediction'],\n",
    "    histnorm='percent',\n",
    "#     histfunc='sum',\n",
    "    yaxis_title_text='Percentage of Points',\n",
    "    xaxis_title_text='Average PNKA',\n",
    "    nbinsx=10,\n",
    "    yrange=[0,100],\n",
    "    xrange=[0.,1],\n",
    "#     xaxis=dict(\n",
    "#         dtick=0.1,\n",
    "#         linecolor = \"black\"),\n",
    "    xaxis = dict(\n",
    "        dtick=0.1,\n",
    "        linecolor = \"black\",\n",
    "        spikedash = 'solid',\n",
    "        showgrid=True,\n",
    "        gridcolor='lightgrey',\n",
    "    ),\n",
    "#     yaxis=dict(\n",
    "#             linecolor = \"black\",),\n",
    "    yaxis = dict(\n",
    "        linecolor = \"black\",\n",
    "        spikedash = 'solid',\n",
    "        showgrid=True,\n",
    "        gridcolor='lightgrey',\n",
    "    ),\n",
    "    font=dict(\n",
    "        family=\"Times New Roman\",\n",
    "        size=23,\n",
    "        color=\"Black\"\n",
    "    ),\n",
    "    legend=dict(\n",
    "        yanchor=\"top\",\n",
    "        y=0.99,\n",
    "        xanchor=\"left\",\n",
    "        x=0.01,\n",
    "        title_font_family=\"Times New Roman\",\n",
    "        font=dict(size= 25)\n",
    "    ),\n",
    "#     save_path=filename,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import plotly.express as px\n",
    "COLORS = px.colors.qualitative.Plotly\n",
    "COLORS[0]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "range_points = int(len(df) / 10)\n",
    "total_bins = int(len(df) / range_points)\n",
    "total_bins"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ascending = True\n",
    "df_sorted = df.sort_values('avg', ascending=ascending)\n",
    "df_sorted = df_sorted.reset_index()\n",
    "df_sorted"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "split_df = []\n",
    "agree_split_df = []\n",
    "notagree_split_df = []\n",
    "\n",
    "avg_pnka, std_pnka = [], []\n",
    "agree_percentage_per_bin = []\n",
    "notagree_percentage_per_bin = []\n",
    "\n",
    "for bin_idx in range(total_bins):\n",
    "    partial_df_sorted = df_sorted.iloc[bin_idx*range_points:(bin_idx*range_points)+range_points]\n",
    "    partial_df_agree = partial_df_sorted[partial_df_sorted['all_correct'] == 1] # perturbed\n",
    "    partial_df_notagree = partial_df_sorted[partial_df_sorted['all_correct'] == 0]\n",
    "    print(len(partial_df_sorted), 'a', (len(partial_df_agree), len(partial_df_agree)/len(partial_df_sorted),\n",
    "                                  'na', len(partial_df_notagree),len(partial_df_notagree)/len(partial_df_sorted)))\n",
    "\n",
    "    agree_percentage_per_bin.append(len(partial_df_agree)/len(partial_df_sorted))\n",
    "    notagree_percentage_per_bin.append(len(partial_df_notagree)/len(partial_df_sorted))\n",
    "    avg_pnka.append(partial_df_sorted['avg'].mean())\n",
    "    std_pnka.append(partial_df_sorted['avg'].mean())\n",
    "#     split_df.append(partial_df_sorted)\n",
    "#     perturbed_split_df.append(partial_df_perturbed)\n",
    "#     notperturbed_split_df.append(partial_df_notperturbed)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# range_for_plot = np.concatenate((np.arange(-0.95, 0.0, 0.1), np.arange(0.05, 1, 0.1)), 0)\n",
    "# range_for_plot, len(range_for_plot)\n",
    "range_for_plot = np.arange(total_bins)\n",
    "range_for_plot, len(range_for_plot)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "filename = os.path.join(path_to_save, f'hist_bycorrectness_ranking_{dataset}-{arch1}-{layer}_avgoverdiffseeds_nbinsx10_top{nb_landmarks}balancedlandmarksfromtrain.pdf')\n",
    "filename"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import plotly.graph_objects as go\n",
    "\n",
    "fig = go.Figure(data=[\n",
    "    go.Bar(name='Correct Prediction',\n",
    "           x=range_for_plot,\n",
    "           y=agree_percentage_per_bin,\n",
    "           marker_color=COLORS[0]),\n",
    "    go.Bar(name='Incorrect Prediction',\n",
    "           x=range_for_plot,\n",
    "           y=notagree_percentage_per_bin,\n",
    "           marker_color=COLORS[1]),\n",
    "])\n",
    "\n",
    "\n",
    "fig.update_layout(\n",
    "    xaxis_title_text=f'Ranking of PNKA score ({range_points} points in each bin)',\n",
    "    yaxis_title_text=f'Percentage',\n",
    "    barmode='stack',\n",
    "    yaxis = dict(\n",
    "        linecolor = \"black\",\n",
    "        spikedash = 'solid',\n",
    "        showgrid=True,\n",
    "        gridcolor='lightgrey'),\n",
    "    xaxis = dict(\n",
    "        linecolor = \"black\",\n",
    "        spikedash = 'solid',\n",
    "        showgrid=True,\n",
    "        gridcolor='lightgrey',\n",
    "        tickmode = 'array',\n",
    "        tickvals = range_for_plot,\n",
    "#         ticktext = x_axis_names\n",
    "    ),\n",
    "    font=dict(\n",
    "            family=\"Times New Roman\",\n",
    "            size=23,\n",
    "            color=\"Black\"\n",
    "        ),\n",
    "    legend=dict(\n",
    "        orientation=\"h\",\n",
    "        yanchor=\"top\",\n",
    "        y=1.2,\n",
    "        xanchor=\"left\",\n",
    "        x=0.01\n",
    "    ),\n",
    "    paper_bgcolor='rgba(0,0,0,0)',\n",
    "    plot_bgcolor='rgba(0,0,0,0)',\n",
    ")\n",
    "fig.update_yaxes(range=[0, 1])\n",
    "\n",
    "\n",
    "for x_vline_idx, (x_vline_item, avg_score) in enumerate(zip(range_for_plot, avg_pnka)):\n",
    "    score = round(avg_score,3)\n",
    "    fig.add_vline(x=x_vline_item, line_width=2, line_dash='dash',\n",
    "                  line_color='black', annotation_text=str(score),\n",
    "                  annotation=dict(font_size=16, font_family=\"Times New Roman\"),\n",
    "                  annotation_position='top')\n",
    "\n",
    "fig.write_image(filename)\n",
    "print(f'Saved in {filename}')\n",
    "fig.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.9"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
