{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# AD Statistics  "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import cv2\n",
    "import csv\n",
    "import sys\n",
    "os.environ[\"HF_HOME\"] = \"../models\"\n",
    "\n",
    "import timm\n",
    "import torch\n",
    "import numpy as np\n",
    "from PIL import Image\n",
    "import matplotlib.pyplot as plt\n",
    "import matplotlib as mpl\n",
    "from typing import Dict, Any, Tuple\n",
    "import pandas as pd\n",
    "from utils import calculate_all_metrics, robustness_metrics, calculate_avg_exp_size, reapplied_loss, calculate_expected_mask, calculate_spectral_entropy, calculate_confidence_difference, robustness_metrics_images\n",
    "from torchvision.models import get_model, ResNet50_Weights\n",
    "from tqdm import tqdm\n",
    "from rex_xai.output.database import db_to_pandas\n",
    "\n",
    "from interpretable_resnet_torchvision import InterpretableResNet50\n",
    "from interpretable_regnety import InterpretableRegNetY\n",
    "\n",
    "from robustness_plot_code import create_figure\n",
    "\n",
    "dataset_path_IN_1k = \"../ImageNet-onek/IN-onek_data/Test\"\n",
    "dataset_path_CT_256 = '../CalTech-256/Dataset/exp_test'\n",
    "dataset_path_IN_1k_v2 = '../IN-1k_v2/Dataset'"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Task 1: Calculate Robustness for all datasets together"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Full robustness dict\n",
    "#This will hold for every dataset, every model and every method the robustness metrics for every threshol\n",
    "robustness_dict = {}\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "thresholds_dirs = ['Threshold_0.9', 'Threshold_0.7', 'Threshold_0.5', 'Threshold_0.3', 'Threshold_0.1', 'Threshold_0']\n",
    "datasets = {'PASCAL-VOC': '../PASCAL-VOC', 'IN-1k': '../ImageNet-onek', 'IN-1k_v2': '../IN-1k_v2', 'CT-256': '../CalTech-256'}\n",
    "results_directories = {'ResNet': 'Results_resnet', 'RegNet': 'Results_regnet', 'EFN-V2': 'Results_efn_v2'} #, 'MBNet-v4': 'Results_mbnet_v4'}\n",
    "seeds = [42]\n",
    "\n",
    "for dataset_k, dataset_v in datasets.items():\n",
    "    for model_k, model_v in results_directories.items():\n",
    "        robustness_dict[f\"{model_k}-{dataset_k}\"] = {}\n",
    "        for threshold in thresholds_dirs:\n",
    "            beta_goodness_correct, beta_goodness_incorrect = robustness_metrics(os.path.join(dataset_v, model_v, threshold), seeds = seeds)\n",
    "            \n",
    "            for seed in seeds:      \n",
    "                for method in beta_goodness_correct[seed].keys():\n",
    "                    if method in ['min', 'max']:\n",
    "                        if method[0].upper() + method[1:] not in robustness_dict[f\"{model_k}-{dataset_k}\"]:\n",
    "                            robustness_dict[f\"{model_k}-{dataset_k}\"][method[0].upper() + method[1:]] = []\n",
    "                        robustness_dict[f\"{model_k}-{dataset_k}\"][method[0].upper() + method[1:]].append(beta_goodness_correct[seed][method]['mean'])\n",
    "                    \n",
    "                    if method == 'mean':\n",
    "                        if 'Avg' not in robustness_dict[f\"{model_k}-{dataset_k}\"]:\n",
    "                            robustness_dict[f\"{model_k}-{dataset_k}\"][\"Avg\"] = []\n",
    "                        robustness_dict[f\"{model_k}-{dataset_k}\"][\"Avg\"].append(beta_goodness_correct[seed][method]['mean'])\n",
    "\n",
    "                    if method == 0:\n",
    "                        if 'Zero' not in robustness_dict[f\"{model_k}-{dataset_k}\"]:\n",
    "                            robustness_dict[f\"{model_k}-{dataset_k}\"][\"Zero\"] = []\n",
    "                        robustness_dict[f\"{model_k}-{dataset_k}\"][\"Zero\"].append(beta_goodness_correct[seed][method]['mean'])\n",
    "                    \n",
    "                    if method == 'AD':\n",
    "                        if 'AD' not in robustness_dict[f\"{model_k}-{dataset_k}\"]:\n",
    "                            robustness_dict[f\"{model_k}-{dataset_k}\"][\"AD\"] = []\n",
    "                        robustness_dict[f\"{model_k}-{dataset_k}\"][\"AD\"].append(beta_goodness_correct[seed][method]['mean'])\n",
    "\n",
    "robustness_dict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "new_robustness_dict = {}\n",
    "for k, v in robustness_dict.items():\n",
    "    new_key = k\n",
    "    if 'RegNet' in k:\n",
    "        new_key = new_key.replace('RegNet', 'RegNetY')\n",
    "    \n",
    "    if 'EFN-V2' in k:\n",
    "        new_key = new_key.replace('EFN-V2', 'EfficientNetV2')\n",
    "    \n",
    "    if 'CalTech-256' in k:\n",
    "        new_key = new_key.replace('CalTech-256', 'CT-256')\n",
    "    \n",
    "    new_robustness_dict[new_key] = {}\n",
    "    for k2, v2 in v.items():\n",
    "        new_robustness_dict[new_key][k2] = list(reversed(v2))\n",
    "\n",
    "new_robustness_dict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "new_robustness_dict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "# json.dump(new_robustness_dict, open('Plots/robustness_dict.json', 'w'))\n",
    "new_robustness_dict = json.load(open('Plots/robustness_data.json', 'r'))\n",
    "new_robustness_dict\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from robustness_plot_code_v2 import create_figure\n",
    "create_figure(data=new_robustness_dict, y_lim=[0, 100], save_path_base='Plots/plot')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Task-2: Calculate Model Accuracy"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "thresholds_dirs = ['Threshold_0.9', 'Threshold_0.7', 'Threshold_0.5', 'Threshold_0.3', 'Threshold_0.1', 'Threshold_0']\n",
    "datasets = {'IN-1k': '../ImageNet-onek', 'IN-1k_v2': '../IN-1k_v2', 'CT-256': '../CalTech-256'}\n",
    "results_directories = {'ResNet': 'Results_resnet', 'RegNet': 'Results_regnet', 'EFN-V2': 'Results_efn_v2'}\n",
    "masking_vals = ['AD', '0', 'mean', 'min', 'max']\n",
    "model_accuracy_dict = {}\n",
    "\n",
    "\n",
    "for dataset_k, dataset_v in datasets.items():\n",
    "    for model_k, model_v in results_directories.items():\n",
    "        model_accuracy_dict[f\"{model_k}-{dataset_k}\"] = {}\n",
    "        for masking_val in masking_vals:\n",
    "            model_accuracy_dict[f\"{model_k}-{dataset_k}\"][masking_val] = []\n",
    "            for threshold in thresholds_dirs:\n",
    "                print(\"Masking Value:\", masking_val)\n",
    "                if masking_val != 'AD':\n",
    "                    exp_dir = [os.path.join(dataset_v, model_v, threshold, folder) \\\n",
    "                            for folder in os.listdir(os.path.join(dataset_v, model_v, threshold)) if f\"val_{masking_val}\" in folder]\n",
    "                else:\n",
    "                    exp_dir = [os.path.join(dataset_v, model_v, threshold, folder) \\\n",
    "                            for folder in os.listdir(os.path.join(dataset_v, model_v, threshold)) if masking_val in folder]\n",
    "                \n",
    "                # print(exp_dir)\n",
    "                assert len(exp_dir) == 1\n",
    "                exp_dir = exp_dir[0]\n",
    "\n",
    "                #Load explanation logs\n",
    "                df = pd.read_csv(os.path.join(exp_dir, f\"{exp_dir.split('/')[-1]}.csv\"))\n",
    "\n",
    "                #Calculate model accuracy\n",
    "                try:\n",
    "                    model_accuracy = ((df[' actual classification'] == df[' predicted classification']).sum() * 100) / len(df)\n",
    "                except:\n",
    "                    model_accuracy = ((df[' target'] == df[' classification']).sum() * 100) / len(df)\n",
    "                \n",
    "                model_accuracy_dict[f\"{model_k}-{dataset_k}\"][masking_val].append(model_accuracy)\n",
    "\n",
    "model_accuracy_dict"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Task-3: Calculate Robustness for Background Images as well"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "robustness_dict_iid = {}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "thresholds_dirs = ['Threshold_0.9', 'Threshold_0.7', 'Threshold_0.5', 'Threshold_0.3', 'Threshold_0.1', 'Threshold_0']\n",
    "datasets = {'PASCAL-VOC': '../PASCAL-VOC', 'IN-1k': '../ImageNet-onek', 'IN-1k_v2': '../IN-1k_v2', 'CT-256': '../CalTech-256'}\n",
    "results_directories = {'ResNet': 'Results_resnet', 'RegNet': 'Results_regnet', 'EFN-V2': 'Results_efn_v2'} #, 'MBNet-v4': 'Results_mbnet_v4'}\n",
    "seeds = [42]\n",
    "\n",
    "for dataset_k, dataset_v in datasets.items():\n",
    "    for model_k, model_v in results_directories.items():\n",
    "        robustness_dict_iid[f\"{model_k}-{dataset_k}\"] = {}\n",
    "        for threshold in thresholds_dirs:\n",
    "            beta_goodness_correct, beta_goodness_incorrect = robustness_metrics_images(os.path.join(dataset_v, model_v, threshold), seeds = seeds)\n",
    "            \n",
    "            for seed in seeds:      \n",
    "                for method in beta_goodness_correct[seed].keys():\n",
    "                    if method in ['min', 'max']:\n",
    "                        if method[0].upper() + method[1:] not in robustness_dict_iid[f\"{model_k}-{dataset_k}\"]:\n",
    "                            robustness_dict_iid[f\"{model_k}-{dataset_k}\"][method[0].upper() + method[1:]] = []\n",
    "                        robustness_dict_iid[f\"{model_k}-{dataset_k}\"][method[0].upper() + method[1:]].append(beta_goodness_correct[seed][method]['mean'])\n",
    "                    \n",
    "                    if method == 'mean':\n",
    "                        if 'Avg' not in robustness_dict_iid[f\"{model_k}-{dataset_k}\"]:\n",
    "                            robustness_dict_iid[f\"{model_k}-{dataset_k}\"][\"Avg\"] = []\n",
    "                        robustness_dict_iid[f\"{model_k}-{dataset_k}\"][\"Avg\"].append(beta_goodness_correct[seed][method]['mean'])\n",
    "\n",
    "                    if method == 0:\n",
    "                        if 'Zero' not in robustness_dict_iid[f\"{model_k}-{dataset_k}\"]:\n",
    "                            robustness_dict_iid[f\"{model_k}-{dataset_k}\"][\"Zero\"] = []\n",
    "                        robustness_dict_iid[f\"{model_k}-{dataset_k}\"][\"Zero\"].append(beta_goodness_correct[seed][method]['mean'])\n",
    "                    \n",
    "                    if method == 'AD':\n",
    "                        if 'AD' not in robustness_dict_iid[f\"{model_k}-{dataset_k}\"]:\n",
    "                            robustness_dict_iid[f\"{model_k}-{dataset_k}\"][\"AD\"] = []\n",
    "                        robustness_dict_iid[f\"{model_k}-{dataset_k}\"][\"AD\"].append(beta_goodness_correct[seed][method]['mean'])\n",
    "\n",
    "robustness_dict_iid"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Task-4: Calculate confidence drop-off and the likes"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "thresholds_dirs = ['Threshold_0.9', 'Threshold_0.7', 'Threshold_0.5', 'Threshold_0.3', 'Threshold_0.1', 'Threshold_0']\n",
    "datasets = {'PASCAL-VOC': '../PASCAL-VOC',} #'IN-1k': '../ImageNet-onek', 'IN-1k_v2': '../IN-1k_v2', 'CT-256': '../CalTech-256'}\n",
    "results_directories = {'ResNet': 'Results_resnet', 'RegNet': 'Results_regnet', 'EFN-V2': 'Results_efn_v2'}\n",
    "masking_vals = ['AD', '0', 'mean', 'min', 'max']\n",
    "conf_drop_off_dict = {}\n",
    "conf_drop_off_dict_correct = {}\n",
    "\n",
    "for dataset_k, dataset_v in datasets.items():\n",
    "    for model_k, model_v in results_directories.items():\n",
    "        conf_drop_off_dict[f\"{model_k}-{dataset_k}\"] = {}\n",
    "        conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"] = {}\n",
    "        for threshold in thresholds_dirs:\n",
    "            #Calculate the confidence drop-off for particular model, dataset and threshold\n",
    "            print(\"Model:\", model_k, \"Dataset:\", dataset_k, \"Threshold:\", threshold)\n",
    "            calculate_confidence_difference(threshold_dir = os.path.join(dataset_v, model_v, threshold))\n",
    "\n",
    "            #Load the confidence drop-off data (Common Samples)\n",
    "            df_common_stats_coloured_background = pd.read_csv(os.path.join(dataset_v, model_v, threshold, \\\n",
    "                f\"confidence_difference_colored_background_common_stats_seed_42.csv\"))\n",
    "            df_common_stats_background_img = pd.read_csv(os.path.join(dataset_v, model_v, threshold, \\\n",
    "                f\"confidence_difference_background_images_common_stats_seed_42.csv\"))\n",
    "\n",
    "            #Load the confidence drop-off data (Correct Samples)\n",
    "            df_correct_stats_coloured_background = pd.read_csv(os.path.join(dataset_v, model_v, threshold, \\\n",
    "                f\"confidence_difference_colored_background_correct_stats_seed_42.csv\"))\n",
    "            df_correct_stats_background_img = pd.read_csv(os.path.join(dataset_v, model_v, threshold, \\\n",
    "                f\"confidence_difference_background_images_correct_stats_seed_42.csv\"))\n",
    "            conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold] = {}\n",
    "            conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold] = {}\n",
    "            for masking_val in masking_vals:\n",
    "                conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val] = {}\n",
    "                conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val] = {}\n",
    "\n",
    "                conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Explanation Confidence (Common) (CB)'] = df_common_stats_coloured_background[df_common_stats_coloured_background['Method'] == masking_val]['Average Explanation Confidence'].values[0]\n",
    "                conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Explanation Confidence (Common) (CB)'] = df_common_stats_coloured_background[df_common_stats_coloured_background['Method'] == masking_val]['Std Explanation Confidence'].values[0] \n",
    "                # conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Explanation Confidence (Common) (BI)'] = df_common_stats_background_img[df_common_stats_background_img['Method'] == masking_val]['Average Explanation Confidence'].values[0]\n",
    "                # conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Explanation Confidence (Common) (BI)'] = df_common_stats_background_img[df_common_stats_background_img['Method'] == masking_val]['Std Explanation Confidence'].values[0]\n",
    "\n",
    "                conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Difference (Common) (CB)'] = df_common_stats_coloured_background[df_common_stats_coloured_background['Method'] == masking_val]['Average Difference'].values[0]\n",
    "                conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Difference (Common) (CB)'] = df_common_stats_coloured_background[df_common_stats_coloured_background['Method'] == masking_val]['Std Difference'].values[0]\n",
    "                # conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Difference (Common) (BI)'] = df_common_stats_background_img[df_common_stats_background_img['Method'] == masking_val]['Average Difference'].values[0]\n",
    "                # conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Difference (Common) (BI)'] = df_common_stats_background_img[df_common_stats_background_img['Method'] == masking_val]['Std Difference'].values[0]\n",
    "\n",
    "                conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Difference(absolute) (Common) (CB)'] = df_common_stats_coloured_background[df_common_stats_coloured_background['Method'] == masking_val]['Average Difference(absolute)'].values[0]\n",
    "                conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Difference(absolute) (Common) (CB)'] = df_common_stats_coloured_background[df_common_stats_coloured_background['Method'] == masking_val]['Std Difference(absolute)'].values[0]\n",
    "                # conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Difference(absolute) (Common) (BI)'] = df_common_stats_background_img[df_common_stats_background_img['Method'] == masking_val]['Average Difference(absolute)'].values[0]\n",
    "                # conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Difference(absolute) (Common) (BI)'] = df_common_stats_background_img[df_common_stats_background_img['Method'] == masking_val]['Std Difference(absolute)'].values[0]\n",
    "\n",
    "                conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Percentage Difference (Common) (CB)'] = df_common_stats_coloured_background[df_common_stats_coloured_background['Method'] == masking_val]['Average Percentage Difference'].values[0]\n",
    "                conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Percentage Difference (Common) (CB)'] = df_common_stats_coloured_background[df_common_stats_coloured_background['Method'] == masking_val]['Std Percentage Difference'].values[0]\n",
    "                # conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Percentage Difference (Common) (BI)'] = df_common_stats_background_img[df_common_stats_background_img['Method'] == masking_val]['Average Percentage Difference'].values[0]\n",
    "                # conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Percentage Difference (Common) (BI)'] = df_common_stats_background_img[df_common_stats_background_img['Method'] == masking_val]['Std Percentage Difference'].values[0]\n",
    "\n",
    "                conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Percentage Difference(absolute) (Common) (CB)'] = df_common_stats_coloured_background[df_common_stats_coloured_background['Method'] == masking_val]['Average Percentage Difference(absolute)'].values[0]\n",
    "                conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Percentage Difference(absolute) (Common) (CB)'] = df_common_stats_coloured_background[df_common_stats_coloured_background['Method'] == masking_val]['Std Percentage Difference(absolute)'].values[0]\n",
    "                # conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Percentage Difference(absolute) (Common) (BI)'] = df_common_stats_background_img[df_common_stats_background_img['Method'] == masking_val]['Average Percentage Difference(absolute)'].values[0]\n",
    "                # conf_drop_off_dict[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Percentage Difference(absolute) (Common) (BI)'] = df_common_stats_background_img[df_common_stats_background_img['Method'] == masking_val]['Std Percentage Difference(absolute)'].values[0]\n",
    "\n",
    "\n",
    "                #Now calculate the same for the correct samples\n",
    "                conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Explanation Confidence (Correct) (CB)'] = df_correct_stats_coloured_background[df_correct_stats_coloured_background['Method'] == masking_val]['Average Explanation Confidence'].values[0]\n",
    "                conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Explanation Confidence (Correct) (CB)'] = df_correct_stats_coloured_background[df_correct_stats_coloured_background['Method'] == masking_val]['Std Explanation Confidence'].values[0]\n",
    "                # conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Explanation Confidence (Correct) (BI)'] = df_correct_stats_background_img[df_correct_stats_background_img['Method'] == masking_val]['Average Explanation Confidence'].values[0]\n",
    "                # conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Explanation Confidence (Correct) (BI)'] = df_correct_stats_background_img[df_correct_stats_background_img['Method'] == masking_val]['Std Explanation Confidence'].values[0]\n",
    "\n",
    "                conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Difference (Correct) (CB)'] = df_correct_stats_coloured_background[df_correct_stats_coloured_background['Method'] == masking_val]['Average Difference'].values[0]\n",
    "                conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Difference (Correct) (CB)'] = df_correct_stats_coloured_background[df_correct_stats_coloured_background['Method'] == masking_val]['Std Difference'].values[0]\n",
    "                # conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Difference (Correct) (BI)'] = df_correct_stats_background_img[df_correct_stats_background_img['Method'] == masking_val]['Average Difference'].values[0]\n",
    "                # conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Difference (Correct) (BI)'] = df_correct_stats_background_img[df_correct_stats_background_img['Method'] == masking_val]['Std Difference'].values[0]\n",
    "\n",
    "                conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Difference(absolute) (Correct) (CB)'] = df_correct_stats_coloured_background[df_correct_stats_coloured_background['Method'] == masking_val]['Average Difference(absolute)'].values[0]\n",
    "                conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Difference(absolute) (Correct) (CB)'] = df_correct_stats_coloured_background[df_correct_stats_coloured_background['Method'] == masking_val]['Std Difference(absolute)'].values[0]\n",
    "                # conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Difference(absolute) (Correct) (BI)'] = df_correct_stats_background_img[df_correct_stats_background_img['Method'] == masking_val]['Average Difference(absolute)'].values[0]\n",
    "                # conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Difference(absolute) (Correct) (BI)'] = df_correct_stats_background_img[df_correct_stats_background_img['Method'] == masking_val]['Std Difference(absolute)'].values[0]\n",
    "\n",
    "                conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Percentage Difference (Correct) (CB)'] = df_correct_stats_coloured_background[df_correct_stats_coloured_background['Method'] == masking_val]['Average Percentage Difference'].values[0]\n",
    "                conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Percentage Difference (Correct) (CB)'] = df_correct_stats_coloured_background[df_correct_stats_coloured_background['Method'] == masking_val]['Std Percentage Difference'].values[0]\n",
    "                # conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Percentage Difference (Correct) (BI)'] = df_correct_stats_background_img[df_correct_stats_background_img['Method'] == masking_val]['Average Percentage Difference'].values[0]\n",
    "                # conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Percentage Difference (Correct) (BI)'] = df_correct_stats_background_img[df_correct_stats_background_img['Method'] == masking_val]['Std Percentage Difference'].values[0]\n",
    "\n",
    "                conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Percentage Difference(absolute) (Correct) (CB)'] = df_correct_stats_coloured_background[df_correct_stats_coloured_background['Method'] == masking_val]['Average Percentage Difference(absolute)'].values[0]\n",
    "                conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Percentage Difference(absolute) (Correct) (CB)'] = df_correct_stats_coloured_background[df_correct_stats_coloured_background['Method'] == masking_val]['Std Percentage Difference(absolute)'].values[0]\n",
    "                # conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Average Percentage Difference(absolute) (Correct) (BI)'] = df_correct_stats_background_img[df_correct_stats_background_img['Method'] == masking_val]['Average Percentage Difference(absolute)'].values[0]\n",
    "                # conf_drop_off_dict_correct[f\"{model_k}-{dataset_k}\"][threshold][masking_val]['Std Percentage Difference(absolute) (Correct) (BI)'] = df_correct_stats_background_img[df_correct_stats_background_img['Method'] == masking_val]['Std Percentage Difference(absolute)'].values[0]\n",
    "\n",
    "                \n",
    "                \n",
    "\n",
    "conf_drop_off_dict            "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "average_difference_dict = {}\n",
    "avg_difference_dict = {}\n",
    "times_ad_min = 0"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from create_plots import create_plot\n",
    "\n",
    "data_labels = ['AD', '0', 'min', 'mean', 'max']\n",
    "categories = ['Threshold_0.9', 'Threshold_0.7', 'Threshold_0.5', 'Threshold_0.3', 'Threshold_0.1', 'Threshold_0']\n",
    "dataset_dirs = {'ImageNet-onek': '../ImageNet-onek', 'IN-1k_v2': '../IN-1k_v2', 'CalTech-256': '../CalTech-256','PASCAL-VOC': '../PASCAL-VOC'}\n",
    "\n",
    "model_name = 'efn_v2'\n",
    "model_folder_name = 'EFN_v2'\n",
    "dataset = 'ImageNet-onek'\n",
    "metric = 'Average Explanation Confidence'\n",
    "average_difference_dict[f'{model_name}-{dataset}'] = []\n",
    "\n",
    "data = {}\n",
    "results_csv = pd.read_csv(os.path.join(dataset_dirs[dataset], f'Results_{model_name}',\n",
    "                                               categories[0],f'{model_folder_name}_AD_seed_42_threshold_0.9',\n",
    "                                               f'{model_folder_name}_AD_seed_42_threshold_0.9.csv'))\n",
    "try:\n",
    "    results_csv = results_csv[results_csv[' actual classification'] == results_csv[' predicted classification']]\n",
    "    # results_csv = results_csv[results_csv[' predicted classification'] == results_csv[' area']]\n",
    "except:\n",
    "    results_csv = results_csv[results_csv[' target'] == results_csv[' classification']]\n",
    "correct_files = results_csv['Filename']\n",
    "print('Length of correct files:', len(correct_files))\n",
    "results_db = db_to_pandas(os.path.join(dataset_dirs[dataset], f'Results_{model_name}',\n",
    "                                               categories[0],f'{model_folder_name}_AD_seed_42_threshold_0.9',\n",
    "                                               f'{model_folder_name}_AD_seed_42_threshold_0.9.db'))\n",
    "# print(results_db)\n",
    "original_conf_data = results_db[results_db['path'].isin(correct_files)].confidence.mean()\n",
    "print(original_conf_data)\n",
    "\n",
    "#Calculate the threshold confidence values\n",
    "threshold_conf_values = []\n",
    "for category in categories:\n",
    "    threshold_conf_values.append(float(category.split('_')[1])*original_conf_data)\n",
    "\n",
    "conf_values = []\n",
    "for category in categories:\n",
    "    conf_threshold_data = pd.read_csv(os.path.join(dataset_dirs[dataset], f'Results_{model_name}',\n",
    "                                                   category,'confidence_difference_colored_background_correct_stats_seed_42.csv'))\n",
    "    conf_values.append(float(category.split('_')[1])*original_conf_data)\n",
    "    for method in conf_threshold_data['Method'].unique():\n",
    "        if method not in data:\n",
    "            data[method] = []\n",
    "        if method == 'AD':\n",
    "            ad_val = round(abs(conf_threshold_data[conf_threshold_data['Method'] == method][metric].values[0]), 3)\n",
    "        data[method].append(round(abs(conf_threshold_data[conf_threshold_data['Method'] == method][metric].values[0]), 3))\n",
    "        conf_values.append(round(abs(conf_threshold_data[conf_threshold_data['Method'] == method][metric].values[0]), 3))\n",
    "    \n",
    "    average_difference_dict[f'{model_name}-{dataset}'].append(max(conf_values) - min(conf_values))\n",
    "    if ad_val == min(conf_values):\n",
    "        times_ad_min += 1\n",
    "\n",
    "average_difference_dict[f'{model_name}-{dataset}'] = np.mean(average_difference_dict[f'{model_name}-{dataset}'])\n",
    "print(average_difference_dict)\n",
    "create_plot(data, data_labels, categories, hlines = threshold_conf_values)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "times_ad_min"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "average_difference_dict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Second, Create a similar plot for the "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Task-5: Calculate the Energy-Pointing-Game Score"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Task-6: Calculate the Average Size of the explanations"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "size_dict = {}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "thresholds_dirs = ['Threshold_0.9', 'Threshold_0.7', 'Threshold_0.5', 'Threshold_0.3', 'Threshold_0.1', 'Threshold_0']\n",
    "datasets = {'IN-1k': '../ImageNet-onek', 'IN-1k_v2': '../IN-1k_v2', 'CT-256': '../CalTech-256', 'PASCAL-VOC': '../PASCAL-VOC'}\n",
    "results_directories = {'ResNet': 'Results_resnet', 'RegNet': 'Results_regnet', 'EFN-V2': 'Results_efn_v2'} #'MBNet-v4': 'Results_mbnet_v4'}\n",
    "model_sizes = {'ResNet': (224, 224), 'RegNet-IN-1k': (224, 224), 'RegNet': (384, 384), 'EFN-V2': (300, 300), 'MBNet-v4': (448, 448)}\n",
    "methods = ['Max','Min','Mean','Zero','AD']\n",
    "seeds = [42]\n",
    "\n",
    "for dataset_k, dataset_v in datasets.items():\n",
    "    for model_k, model_v in results_directories.items():\n",
    "        size_dict[f\"{model_k}-{dataset_k}\"] = {}\n",
    "        for threshold in thresholds_dirs:\n",
    "            if model_k == 'RegNet' and dataset_k == 'IN-1k':\n",
    "                img_size = model_sizes['RegNet-IN-1k']\n",
    "            else:\n",
    "                img_size = model_sizes[model_k]\n",
    "            \n",
    "            pixel_count_results = pd.read_csv(os.path.join(dataset_v, model_v, threshold, f\"pixel_count_results_seed_42.csv\"))\n",
    "            for method in methods:\n",
    "                avg_exp_size_perc = pixel_count_results[method].mean() / (img_size[0] * img_size[1])\n",
    "                if method not in size_dict[f\"{model_k}-{dataset_k}\"]:\n",
    "                    size_dict[f\"{model_k}-{dataset_k}\"][method] = []\n",
    "                size_dict[f\"{model_k}-{dataset_k}\"][method].append(avg_exp_size_perc)\n",
    "\n",
    "size_dict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(\"-----ResNet Scores---------\")\n",
    "print(\"IN-1k\",np.array(size_dict['ResNet-IN-1k']['AD']) - np.array(size_dict['ResNet-IN-1k']['Max']))\n",
    "print(\"IN-1k_v2\",np.array(size_dict['ResNet-IN-1k_v2']['AD']) - np.array(size_dict['ResNet-IN-1k_v2']['Max']))\n",
    "print(\"CalTech-256\",np.array(size_dict['ResNet-CT-256']['AD']) - np.array(size_dict['ResNet-CT-256']['Max']))\n",
    "print(\"PASCAL-VOC\",np.array(size_dict['ResNet-PASCAL-VOC']['AD']) - np.array(size_dict['ResNet-PASCAL-VOC']['Min']))\n",
    "\n",
    "print(\"-----RegNet Scores---------\")\n",
    "print(\"IN-1k\",np.array(size_dict['RegNet-IN-1k']['AD']) - np.array(size_dict['RegNet-IN-1k']['Max']))\n",
    "print(\"IN-1k_v2\",np.array(size_dict['RegNet-IN-1k_v2']['AD']) - np.array(size_dict['RegNet-IN-1k_v2']['Max']))\n",
    "print(\"CalTech-256\",np.array(size_dict['RegNet-CT-256']['AD']) - np.array(size_dict['RegNet-CT-256']['Mean']))\n",
    "print(\"PASCAL-VOC\",np.array(size_dict['RegNet-PASCAL-VOC']['AD']) - np.array(size_dict['RegNet-PASCAL-VOC']['Max']))\n",
    "\n",
    "print(\"-----EFN-V2 Scores---------\")\n",
    "print(\"IN-1k\",np.array(size_dict['EFN-V2-IN-1k']['AD']) - np.array(size_dict['EFN-V2-IN-1k']['Zero']))\n",
    "print(\"IN-1k_v2\",np.array(size_dict['EFN-V2-IN-1k_v2']['AD']) - np.array(size_dict['EFN-V2-IN-1k_v2']['Zero']))\n",
    "print(\"CalTech-256\",np.array(size_dict['EFN-V2-CT-256']['AD']) - np.array(size_dict['EFN-V2-CT-256']['Zero']))\n",
    "print(\"PASCAL-VOC\",np.array(size_dict['EFN-V2-PASCAL-VOC']['AD']) - np.array(size_dict['EFN-V2-PASCAL-VOC']['Zero']))\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## IN-1k"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "with open(\"../ImageNet-onek/bbox_data.csv\", \"r\") as f:\n",
    "    reader = csv.reader(f)\n",
    "    bbox_data = list(reader)[1:]\n",
    "bbox_data = list(map(lambda x: [x[0], [int(coord) for coord in x[1].split(' ')[:-1] if 'n' not in coord]], bbox_data))\n",
    "for i in range(len(bbox_data)):\n",
    "    num_obj = len(bbox_data[i][1]) // 4\n",
    "    coords_list = []\n",
    "    for j in range(num_obj):\n",
    "        coords_list.append(bbox_data[i][1][j*4:(j+1)*4])\n",
    "    bbox_data[i][1] = coords_list\n",
    "\n",
    "bbox_data_df = pd.DataFrame(bbox_data, columns=['File', 'Bounding Boxes'])\n",
    "\n",
    "# bbox_data\n",
    "# Now, we need to process the calculated files bounding boxes\n",
    "thresholds_dirs = ['Threshold_0.9', 'Threshold_0.7', 'Threshold_0.5', 'Threshold_0.3', 'Threshold_0.1', 'Threshold_0']\n",
    "results_directories = {'ResNet': '../ImageNet-onek/Results_resnet', 'RegNet': '../ImageNet-onek/Results_regnet', 'EFN-V2': '../ImageNet-onek/Results_efn_v2'}\n",
    "masking_vals = ['AD', '0', 'mean', 'min', 'max']\n",
    "model_sizes = {'ResNet': (224, 224), 'RegNet': (384, 384), 'EFN-V2': (300, 300), 'MBNet-v4': (448, 448)}\n",
    "dataset_path = '../ImageNet-onek/IN-onek_data/Test'\n",
    "\n",
    "for model_k, model_v in results_directories.items():\n",
    "    for threshold in thresholds_dirs:\n",
    "        for masking_val in masking_vals:\n",
    "            relevant_dir = [os.path.join(model_v, threshold, model_dir) for model_dir \\\n",
    "                    in os.listdir(os.path.join(model_v, threshold)) if masking_val in model_dir and \\\n",
    "                    os.path.isdir(os.path.join(model_v, threshold, model_dir))]\n",
    "            \n",
    "            assert len(relevant_dir) == 1, f\"Expected 1 directory, got {len(relevant_dir)} for {model_k} {threshold} {masking_val}\"\n",
    "            relevant_dir = relevant_dir[0]\n",
    "\n",
    "            for file in os.listdir(relevant_dir):\n",
    "                if file.endswith('.png'):\n",
    "                    bbox_coords = bbox_data_df[bbox_data_df['File'] == file.split('_class')[0]]['Bounding Boxes'].values[0]\n",
    "                    img_file = np.array(Image.open(os.path.join(dataset_path, file.replace('.png', '.jpeg'))))\n",
    "                    exp_file = np.array(Image.open(os.path.join(relevant_dir, file)))\n",
    "                    \n",
    "                    for bbox_coord in bbox_coords:\n",
    "                        x_min, y_min, x_max, y_max = bbox_coord\n",
    "\n",
    "                        #Need to figure out how to scale the bounding boxes\n",
    "                        s_x = model_sizes[model_k][0]/img_file.shape[0]\n",
    "                        s_y = model_sizes[model_k][1]/img_file.shape[1]\n",
    "\n",
    "                        x_min, x_max, y_min, y_max = int(x_min*s_x), int(x_max*s_x), int(y_min*s_y), int(y_max*s_y)\n",
    "                        print(x_min, x_max, y_min, y_max)\n",
    "\n",
    "                        thickness = 2\n",
    "                        color = (0, 0, 255)\n",
    "                        img_file = cv2.rectangle(img_file, (x_min, y_min), (x_max, y_max), color, thickness)\n",
    "                        exp_file = cv2.rectangle(exp_file, (x_min, y_min), (x_max, y_max), color, thickness)\n",
    "\n",
    "                        cv2.imshow('img', img_file)\n",
    "                        cv2.imshow('exp', exp_file)\n",
    "                        cv2.waitKey(0)\n",
    "                    sys.exit()\n",
    "    "
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "AD",
   "language": "python",
   "name": "ad"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
