{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np \n",
    "from minio_obj_storage import upload_numpy_as_blob, get_numpy_from_cloud\n",
    "\n",
    "container_name = 'hiker-scores'\n",
    "container_dir = 'cifar100'\n",
    "lts = []\n",
    "loss_grad = []\n",
    "loss = []\n",
    "loss_curvature = []\n",
    "for epoch in range(45):\n",
    "    lt_4_eph = get_numpy_from_cloud(container_name, container_dir, f\"learning_time_cifar100_resnet18_wd1_{epoch}.pt\")\n",
    "    loss_grad_4_eph = get_numpy_from_cloud(container_name, container_dir, f\"loss_grad_resnet18_wd1_{epoch}.npy\")\n",
    "    loss_4_eph = get_numpy_from_cloud(container_name, container_dir, f\"loss_resnet18_wd1_{epoch}.npy\")\n",
    "    loss_curvature_4_eph = get_numpy_from_cloud(container_name, container_dir, f\"loss_curvature_resnet18_wd1_{epoch}_h_0.001_n_10.npy\")\n",
    "    lts.append(lt_4_eph)\n",
    "    loss_grad.append(loss_grad_4_eph)\n",
    "    loss.append(loss_4_eph)\n",
    "    loss_curvature.append(loss_curvature_4_eph)\n",
    "\n",
    "lts = np.array(lts)\n",
    "loss_grads = np.array(loss_grad)\n",
    "losses = np.array(loss)\n",
    "loss_curvatures = np.array(loss_curvature)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [],
   "source": [
    "learning_time = 1 - lts.mean(axis=0)\n",
    "loss_grad = loss_grads.sum(axis=0)\n",
    "loss = losses.sum(axis=0)\n",
    "loss_curvature = loss_curvatures.mean(0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "\n",
    "df = pd.DataFrame(data={'lt':learning_time, 'loss_grad': loss_grad, 'loss': loss, 'loss_curvature': loss_curvature})\n",
    "# Define the number of bins you want\n",
    "num_bins = 15  # Adjust this number as needed\n",
    "\n",
    "# Bin the data based on learning time\n",
    "df['lt_bins'] = pd.cut(df['lt'], bins=num_bins)\n",
    "binned_df = df.groupby('lt_bins').mean()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "import scienceplots\n",
    "\n",
    "plt.style.use(['ieee','science', 'grid'])\n",
    "textwidth = 3.31314\n",
    "aspect_ratio = 6/8\n",
    "scale = 1.0\n",
    "width = textwidth * scale\n",
    "height = width * aspect_ratio\n",
    "fig = plt.figure(figsize=(width, height))\n",
    "ax1 = fig.gca()\n",
    "\n",
    "# Define font size\n",
    "font_size = 12\n",
    "\n",
    "# Plot loss on ax1\n",
    "ax1.set_ylabel('CSL', color='g', fontsize=font_size)\n",
    "ax1.scatter(binned_df['lt'], binned_df['loss'], color='g', alpha=0.8, marker='x', label='Loss')\n",
    "ax1.tick_params(axis='y', labelcolor='g', labelsize=font_size)\n",
    "\n",
    "# Create a twin x-axis to plot 'loss_grad'\n",
    "ax2 = ax1.twinx()\n",
    "ax2.set_ylabel('CSG', color='b', fontsize=font_size)\n",
    "ax1.set_xlabel('Learning Time', fontsize=font_size)\n",
    "ax2.scatter(binned_df['lt'], binned_df['loss_grad'], color='b', alpha=0.8, marker='x', label='Loss Grad')\n",
    "ax2.tick_params(axis='y', labelcolor='b', labelsize=font_size)\n",
    "\n",
    "# Set x-axis tick size\n",
    "ax1.tick_params(axis='x', labelsize=font_size)\n",
    "\n",
    "# Set title with a larger font size\n",
    "plt.title('CIFAR-100', fontsize=font_size)\n",
    "\n",
    "plt.show()"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "py3.11_tf",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.5"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
