{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "d5e697cf-5b9c-4596-af90-c4ff422ae4bc",
   "metadata": {},
   "outputs": [],
   "source": [
    "# This code analyzes the shallow archtiectures cardinality\n",
    "# In particular, it finds architectures with a given expressive capacity "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "f826341b-96c3-44f7-aa91-6321048a525a",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import glob"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "fcacf24d-566e-4625-9293-c170cc90ef01",
   "metadata": {},
   "outputs": [],
   "source": [
    "def combine_csv_files(output_file=\"combined_results.csv\"):\n",
    "    # Find all CSV files that match the pattern 'result_p*.csv' in the current directory\n",
    "    csv_files = glob.glob(\"result_p*.csv\")\n",
    "\n",
    "    if not csv_files:\n",
    "        print(\"No matching CSV files found.\")\n",
    "        return\n",
    "\n",
    "    # Initialize an empty DataFrame to hold all data\n",
    "    combined_df = pd.DataFrame()\n",
    "\n",
    "    # Loop over each file and append its content to the combined DataFrame\n",
    "    for file in csv_files:\n",
    "        print(f\"Reading file: {file}\")\n",
    "        df = pd.read_csv(file)\n",
    "        combined_df = pd.concat([combined_df, df], ignore_index=True)\n",
    "\n",
    "    # # Remove duplicate rows if any\n",
    "    # combined_df.drop_duplicates(inplace=True)\n",
    "\n",
    "    # Sort the data by architecture parameters: n, m, k\n",
    "    if {\"n\", \"m\", \"k\"}.issubset(combined_df.columns):\n",
    "        combined_df.sort_values(by=[\"n\", \"m\", \"k\"], inplace=True)\n",
    "\n",
    "    # Save the cleaned and sorted DataFrame to a new CSV file\n",
    "    combined_df.to_csv(output_file, index=False)\n",
    "    print(f\"Combined results saved to: {output_file}\")\n",
    "\n",
    "def filter_architectures(df, n=None, m=None, k=None):\n",
    "    if n is not None:\n",
    "        df = df[df[\"n\"] == n]\n",
    "    if m is not None:\n",
    "        df = df[df[\"m\"] == m]\n",
    "    if k is not None:\n",
    "        df = df[df[\"k\"] == k]\n",
    "\n",
    "    # Sort by prime and r ascending\n",
    "    df = df.sort_values(by=[\"prime\", \"r\"], ascending=[True, True]) # Save the filtered results\n",
    "\n",
    "    return df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "37c426b6-ddcd-4a6b-8f02-021e4d91d9d7",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Reading file: result_p3_r2.csv\n",
      "Reading file: result_p7_r2.csv\n",
      "Reading file: result_p5_r2.csv\n",
      "Reading file: result_p2_r2.csv\n",
      "Reading file: result_p11_r2.csv\n",
      "Combined results saved to: combined_results.csv\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/var/folders/nn/jp9ysjms6wqcnl8v0zz7wnbm0000gn/T/ipykernel_47060/2433738703.py:16: FutureWarning: The behavior of DataFrame concatenation with empty or all-NA entries is deprecated. In a future version, this will no longer exclude empty or all-NA columns when determining the result dtypes. To retain the old behavior, exclude the relevant entries before the concat operation.\n",
      "  combined_df = pd.concat([combined_df, df], ignore_index=True)\n"
     ]
    }
   ],
   "source": [
    "# Combine all results\n",
    "combine_csv_files()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "b06c5090-39e6-4a4e-aefb-63402fe395c7",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>n</th>\n",
       "      <th>m</th>\n",
       "      <th>k</th>\n",
       "      <th>prime</th>\n",
       "      <th>r</th>\n",
       "      <th>cardinality</th>\n",
       "      <th>amb_space_card</th>\n",
       "      <th>ratio</th>\n",
       "      <th>dim_amb</th>\n",
       "      <th>time_sec</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "      <td>2</td>\n",
       "      <td>393</td>\n",
       "      <td>729</td>\n",
       "      <td>0.539095</td>\n",
       "      <td>6</td>\n",
       "      <td>0.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>7</td>\n",
       "      <td>2</td>\n",
       "      <td>59185</td>\n",
       "      <td>117649</td>\n",
       "      <td>0.503064</td>\n",
       "      <td>6</td>\n",
       "      <td>174.9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>5</td>\n",
       "      <td>2</td>\n",
       "      <td>7945</td>\n",
       "      <td>15625</td>\n",
       "      <td>0.508480</td>\n",
       "      <td>6</td>\n",
       "      <td>11.9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>16</td>\n",
       "      <td>64</td>\n",
       "      <td>0.250000</td>\n",
       "      <td>6</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   n  m  k  prime  r  cardinality  amb_space_card     ratio  dim_amb  time_sec\n",
       "0  2  2  2      3  2          393             729  0.539095        6       0.2\n",
       "1  2  2  2      7  2        59185          117649  0.503064        6     174.9\n",
       "2  2  2  2      5  2         7945           15625  0.508480        6      11.9\n",
       "3  2  2  2      2  2           16              64  0.250000        6       0.0"
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "file_name = 'combined_results.csv'\n",
    "df = pd.read_csv(file_name)\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "02fdba1b",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0    0.539095\n",
       "1    0.503064\n",
       "2    0.508480\n",
       "3    0.250000\n",
       "Name: ratio, dtype: float64"
      ]
     },
     "execution_count": 19,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df['ratio']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "ceaa9d88-05e6-447b-88af-57cfccec81be",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Empty DataFrame\n",
      "Columns: [n, m, k, prime, r, cardinality, amb_space_card, ratio, dim_amb, time_sec]\n",
      "Index: []\n"
     ]
    }
   ],
   "source": [
    "min_val = 0.9\n",
    "max_val = 1.1\n",
    "df_sorted = df.sort_values(by='ratio', ascending=True)\n",
    "df_filt = df_sorted[df_sorted['ratio'].between(min_val, max_val)]\n",
    "df_filt = df_filt[df_filt['prime'] > 2]\n",
    "print(df_filt)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5aa04c65-b657-477e-8684-e00b7ce89fe5",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
