{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np \n",
    "import matplotlib.pyplot as plt\n",
    "import matplotlib.patches as patches\n",
    "import pandas as pd \n",
    "import json\n",
    "import os\n",
    "import glob"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "hyper_path = 'DIR_TO_HYPERPARAMETERS'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "# Group runs by configuration (ignoring the 'seed' value).\n",
    "grouped_runs = {}\n",
    "csv_files = glob.glob(os.path.join(hyper_path, '*', 'episodic_rewards.csv'))\n",
    "# Iterate over each csv file, extract its folder name and its args.txt.\n",
    "episodic_rewards = []\n",
    "smallest_eps_len = 1e9 \n",
    "for csv_file in csv_files:\n",
    "    folder_path = os.path.dirname(csv_file)\n",
    "    folder_name = os.path.basename(folder_path)\n",
    "    args_file = os.path.join(folder_path, \"args.txt\")\n",
    "    \n",
    "    if(smallest_eps_len > len(pd.read_csv(csv_file)['episode'])):\n",
    "        smallest_eps_len = len(pd.read_csv(csv_file)['episode'])\n",
    "        episodic_rewards = pd.read_csv(csv_file)['episode']\n",
    "\n",
    "    # Read the JSON config from args.txt.\n",
    "    with open(args_file, \"r\") as f:\n",
    "        config = json.load(f)\n",
    "    \n",
    "    # Remove the seed attribute, since it's the only differing part.\n",
    "    config.pop(\"seed\", None)\n",
    "    \n",
    "    # Create a key from the remaining configuration; sorting ensures consistent keys.\n",
    "    config_key = json.dumps(config, sort_keys=True)\n",
    "    \n",
    "    # Group folder names by the configuration key.\n",
    "    grouped_runs.setdefault(config_key, []).append(folder_name)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "plt.figure(figsize=(12, 8))\n",
    "for csv_file in csv_files:\n",
    "    df_tmp = pd.read_csv(csv_file)\n",
    "    folder_name = os.path.basename(os.path.dirname(csv_file))\n",
    "    plt.plot(df_tmp['episode'], df_tmp['reward'], label=folder_name)\n",
    "\n",
    "plt.xlabel(\"Episode\")\n",
    "plt.ylabel(\"Reward\")\n",
    "plt.title(\"Reward per Episode for All Runs\")\n",
    "plt.legend(bbox_to_anchor=(1.05, 1), loc='upper left')\n",
    "plt.tight_layout()\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "plt.figure(figsize=(10, 6))\n",
    "best_avg = -np.inf\n",
    "best_config_key = None\n",
    "best_folder = None\n",
    "\n",
    "for config_key, folders in grouped_runs.items():\n",
    "    group_rewards = []\n",
    "\n",
    "    for folder in folders:\n",
    "        filepath = os.path.join(hyper_path, folder, 'episodic_rewards.csv')\n",
    "        df = pd.read_csv(filepath)\n",
    "        rewards = df['reward'].values[:smallest_eps_len]\n",
    "        group_rewards.append(rewards)\n",
    "\n",
    "    group_rewards = np.array(group_rewards)\n",
    "    avg_rewards = group_rewards.mean(axis=0)\n",
    "    avg_last100 = avg_rewards[-100:].mean()\n",
    "\n",
    "    label = config_key[:30] + '...' if len(config_key) > 30 else config_key\n",
    "    plt.plot(episodic_rewards, avg_rewards, label=label)\n",
    "\n",
    "    if avg_last100 > best_avg:\n",
    "        best_avg = avg_last100\n",
    "        best_config_key = config_key\n",
    "        best_folder = folders[0]  # choose the first folder in this group\n",
    "\n",
    "print(\"Best group config (highest average reward over the last 100 episodes):\")\n",
    "print(best_config_key)\n",
    "args_path = os.path.join(hyper_path, best_folder, 'args.txt')\n",
    "with open(args_path, 'r') as f:\n",
    "    print(f.read())\n",
    "\n",
    "plt.xlabel(\"Episode\")\n",
    "plt.ylabel(\"Average Episodic Reward\")\n",
    "plt.title(\"Average Episodic Reward per Episode for each grouped_run\")\n",
    "# plt.legend()\n",
    "plt.ylim(0, 700)\n",
    "plt.show()\n",
    "\n",
    "# Plot the best run in a separate figure\n",
    "# Retrieve all folders for the best configuration (across seeds 0, 1, 2)\n",
    "best_group_folders = grouped_runs[best_config_key]\n",
    "all_run_rewards = []\n",
    "\n",
    "for folder in best_group_folders:\n",
    "    filepath = os.path.join(hyper_path, folder, 'episodic_rewards.csv')\n",
    "    df_tmp = pd.read_csv(filepath)\n",
    "    rewards = df_tmp['reward'].values[:smallest_eps_len]\n",
    "    all_run_rewards.append(rewards)\n",
    "\n",
    "all_run_rewards = np.array(all_run_rewards)\n",
    "avg_best_run_rewards = all_run_rewards.mean(axis=0)\n",
    "\n",
    "plt.figure(figsize=(10, 6))\n",
    "plt.plot(episodic_rewards, avg_best_run_rewards, color='red', linewidth=2,\n",
    "         label='Best Run (Avg over 3 seeds)')\n",
    "plt.xlabel(\"Episode\")\n",
    "plt.ylabel(\"Reward\")\n",
    "plt.title(\"Reward per Episode for Best Run (Averaged over 3 seeds)\")\n",
    "plt.legend()\n",
    "plt.ylim(0, 700)\n",
    "plt.show()"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "agar",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.9"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
