{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "977a7e78-c839-4b5e-b887-a4a9e4e53f79",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "_ROOT_PATH = os.path.join('..', '..', '..')\n",
    "_FINAL_DFS_DIR = os.path.join('..', '..', 'final_dfs')\n",
    "_CSV_DIR = os.path.join('..', '..', 'csv_files')\n",
    "\n",
    "import sys\n",
    "sys.path.append('..')\n",
    "sys.path.append(os.path.join('..', '..', '..', 'tools'))\n",
    "import plotconfig"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f3a04c65-a634-4f12-844e-cf388c26fb1e",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import pandas as pd\n",
    "import seaborn as sns\n",
    "import matplotlib.pyplot as plt"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "833ce0e1-aaa2-4bbb-a2f7-55c3044b5aa2",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_file = os.path.join(_FINAL_DFS_DIR, 'optim_rmse_y_true_vs_y_reconstructed.parquet')\n",
    "result_df = pd.read_parquet(df_file, engine='pyarrow')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "472fee22-aab6-488b-a2c9-688d0d44cb80",
   "metadata": {},
   "outputs": [],
   "source": [
    "result_df.iloc[0]['true_labels'].shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6b3e7f6c-d475-4372-adc0-717b48eae8d4",
   "metadata": {},
   "outputs": [],
   "source": [
    "9234*170"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ab1ee846-da07-4796-8457-dd0955226bc8",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Assuming your DataFrame is named 'df'\n",
    "grouped_df = result_df.groupby(['method_name'])\n",
    "\n",
    "# Calculate mean and std for each subtable\n",
    "compiled_result = grouped_df.agg({\n",
    "    'rmse': ['mean', 'std']\n",
    "})\n",
    "\n",
    "# Flatten the column names\n",
    "compiled_result.columns = ['_'.join(col).strip() for col in compiled_result.columns.values]\n",
    "\n",
    "# Reset the index to display method_name and training_size as columns\n",
    "compiled_result = compiled_result.reset_index()\n",
    "compiled_result"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9ed55c99-3ebe-4c99-8fb8-b72d3a5fc5ee",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Dictionary to store rmse values for each method\n",
    "rmse_values = {}\n",
    "true_labels = {}\n",
    "pred_labels = {}\n",
    "\n",
    "# Loop through each unique method name\n",
    "for method in result_df['method_name'].unique():\n",
    "    # Create a mask for the current method\n",
    "    mask = (result_df['method_name'] == method)\n",
    "    \n",
    "    # Filter the DataFrame and get the 'rmse' values\n",
    "    df = result_df[mask]\n",
    "    rmse_values[method] = df['rmse'].values\n",
    "    true_labels[method] = df['true_labels'].values\n",
    "    pred_labels[method] = df['pred_labels'].values"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "3ac1d7cd-6145-4f30-8a32-307bd0921a99",
   "metadata": {},
   "outputs": [],
   "source": [
    "true_labels.keys()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f388c3b3-64b9-407e-9b50-64aa1a4a1184",
   "metadata": {},
   "outputs": [],
   "source": [
    "flattened_true_labels = {method: [label for sublist in labels for label in sublist] for method, labels in true_labels.items()}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5e32706b-7e5e-4d20-be66-955cb8434e58",
   "metadata": {},
   "outputs": [],
   "source": [
    "len(flattened_true_labels['LinearRegression'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "03e57b89-8d35-46fd-b3ce-602cdff244fb",
   "metadata": {},
   "outputs": [],
   "source": [
    "directory = '../../../user_experiments/results'\n",
    "\n",
    "dfs = []\n",
    "for filename in os.listdir(directory):\n",
    "    if filename.endswith('.csv'):\n",
    "        file_path = os.path.join(directory, filename)\n",
    "        df = pd.read_csv(file_path)\n",
    "        dfs.append(df)\n",
    "\n",
    "df = pd.concat(dfs, ignore_index=True)\n",
    "\n",
    "df['match'] = (df['target'] != df['chosen']).astype(int)\n",
    "mask = ((df['showing_time'] == 500))\n",
    "\n",
    "df_masked = df[mask]\n",
    "\n",
    "grouped_df = df_masked.groupby(['rounded_d', 'showing_time'])\n",
    "compiled_result = grouped_df.agg({\n",
    "    'match': ['mean', 'std', 'sem', 'count']\n",
    "})\n",
    "compiled_result.columns = ['_'.join(col).strip() for col in compiled_result.columns.values]\n",
    "compiled_result = compiled_result.reset_index()\n",
    "compiled_result"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a2a21828-a5ed-43d9-abb2-08539277edbc",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "# Dictionary to store rmse values for each method\n",
    "match_values = {}\n",
    "\n",
    "# Loop through each unique method name\n",
    "for rd in df_masked['rounded_d'].unique():\n",
    "    # Create a mask for the current method\n",
    "    mask = (df_masked['rounded_d'] == rd)\n",
    "    \n",
    "    # Filter the DataFrame and get the 'rmse' values\n",
    "    df = df_masked[mask]\n",
    "    match_values[rd] = df['match'].values\n",
    "\n",
    "match_values.keys()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d4939dca-a8c1-4547-bdbc-07b6d0dc4512",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "3128486d-0a19-40f2-8f7b-9d160cbca123",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "from scipy.stats import fisher_exact\n",
    "from itertools import combinations\n",
    "\n",
    "def pairwise_fisher_exact(match_values):\n",
    "    keys = list(match_values.keys())\n",
    "    results = {}\n",
    "\n",
    "    for (key1, key2) in combinations(keys, 2):\n",
    "        x1 = match_values[key1].sum()  # successes in group 1\n",
    "        n1 = len(match_values[key1])   # trials in group 1\n",
    "        x2 = match_values[key2].sum()  # successes in group 2\n",
    "        n2 = len(match_values[key2])   # trials in group 2\n",
    "\n",
    "        contingency_table = [[x1, n1 - x1], [x2, n2 - x2]]\n",
    "        \n",
    "        # Perform Fisher's Exact Test\n",
    "        odds_ratio, p_value = fisher_exact(contingency_table, alternative='two-sided')\n",
    "        \n",
    "        results[(key1, key2)] = {\n",
    "            'odds_ratio': odds_ratio,\n",
    "            'p_value': p_value\n",
    "        }\n",
    "\n",
    "    return results\n",
    "\n",
    "results = pairwise_fisher_exact(match_values)\n",
    "\n",
    "# # Print results\n",
    "# for (key1, key2), stats in results.items():\n",
    "#     print(f\"Comparison between {key1} and {key2}:\")\n",
    "#     print(f\"  Odds Ratio: {stats['odds_ratio']}\")\n",
    "#     print(f\"  P-value: {stats['p_value']}\")\n",
    "#     print()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e4805872-6434-43f1-aaea-6be060c2da0f",
   "metadata": {},
   "outputs": [],
   "source": [
    "results[(3.6, 21.7)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "afd5a16e-5297-408c-9691-52053f90f68b",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.19"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
