{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "\"\"\"\n",
    "This notebook is used to test the distribution of rewards for the ARMO reward model.\n",
    "\"\"\"\n",
    "\n",
    "import json\n",
    "import glob\n",
    "\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Skipping /home/anonymousanonymous/inference-rlhf/data/math/llama-3-3b/generations/llama32medium--shots-1--prompt-idx-1629-generations--armo-rm.json because it has no correct or incorrect scores\n",
      "Skipping /home/anonymousanonymous/inference-rlhf/data/math/llama-3-3b/generations/llama32medium--shots-1--prompt-idx-2643-generations--armo-rm.json because it has no correct or incorrect scores\n",
      "Skipping /home/anonymousanonymous/inference-rlhf/data/math/llama-3-3b/generations/llama32medium--shots-1--prompt-idx-4998-generations--armo-rm.json because it has no correct or incorrect scores\n",
      "Skipping /home/anonymousanonymous/inference-rlhf/data/math/llama-3-3b/generations/llama32medium--shots-1--prompt-idx-3274-generations--armo-rm.json because it has no correct or incorrect scores\n",
      "Skipping /home/anonymousanonymous/inference-rlhf/data/math/llama-3-3b/generations/llama32medium--shots-1--prompt-idx-2534-generations--armo-rm.json because it has no correct or incorrect scores\n",
      "Skipping /home/anonymousanonymous/inference-rlhf/data/math/llama-3-3b/generations/llama32medium--shots-1--prompt-idx-2960-generations--armo-rm.json because it has no correct or incorrect scores\n",
      "Skipping /home/anonymousanonymous/inference-rlhf/data/math/llama-3-3b/generations/llama32medium--shots-1--prompt-idx-2775-generations--armo-rm.json because it has no correct or incorrect scores\n"
     ]
    }
   ],
   "source": [
    "# Find all debug.json files in the specified directory\n",
    "debug_files = glob.glob('/home/anonymousanonymous/inference-rlhf/data/math/llama-3-3b/generations/*armo-rm.json')\n",
    "\n",
    "# Load the content of each file\n",
    "avg_correct_per_problem = []\n",
    "avg_incorrect_per_problem = []\n",
    "\n",
    "for file_path in debug_files:\n",
    "    with open(file_path, 'r') as f:\n",
    "        data = json.load(f)\n",
    "\n",
    "        correct_scores = [output['armo-rm'] for output in data if output['correct']]\n",
    "        incorrect_scores = [output['armo-rm'] for output in data if not output['correct']]\n",
    "\n",
    "        if len(correct_scores) == 0 or len(incorrect_scores) == 0:\n",
    "            print(f\"Skipping {file_path} because it has either no correct or incorrect scores\")\n",
    "            continue\n",
    "\n",
    "        max_score = max(max(correct_scores), max(incorrect_scores))\n",
    "        min_score = min(min(correct_scores), min(incorrect_scores))\n",
    "\n",
    "        # Normalize the scores to be between 0 and 1\n",
    "        correct_scores = [(score - min_score) / (max_score - min_score) for score in correct_scores]\n",
    "        incorrect_scores = [(score - min_score) / (max_score - min_score) for score in incorrect_scores]\n",
    "\n",
    "        avg_correct_per_problem.append(np.mean(correct_scores))\n",
    "        avg_incorrect_per_problem.append(np.mean(incorrect_scores))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAiwAAAGdCAYAAAAxCSikAAAAOnRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjEwLjEsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcvc2/+5QAAAAlwSFlzAAAPYQAAD2EBqD+naQAAOuhJREFUeJzt3XtUVXX+//HXEQW8AWpcCy+oqIhoXkNNMTVkZkzLKXOcQa3RZsKZKTQnmlJEi6YmLy3NpinFvk5j9dW0nzkUMqKpqIVDad4RQyehtADB4SLs3x9+PXXiogfPgQ0+H2vttdyf/dn7vPcHWrz67L3PthiGYQgAAMDEmjV0AQAAANdCYAEAAKZHYAEAAKZHYAEAAKZHYAEAAKZHYAEAAKZHYAEAAKZHYAEAAKbXvKELcITKykp99dVXatu2rSwWS0OXAwAAroNhGLp48aICAgLUrFntcyhNIrB89dVXCgwMbOgyAABAHZw5c0a33XZbrX2aRGBp27atpCsn7OHh0cDVAHCo4mIpIODKv7/6SmrdumHraQQYMjQWhYWFCgwMtP4dr02TCCxXLwN5eHgQWICmxsXl+397ePDX9zowZGhsrud2Dm66BQAApkdgAQAApkdgAQAAptck7mEBANwcDMPQ5cuXVVFR0dCl4Dq5uLioefPmN/y1IwQWAECjUFZWpnPnzunSpUsNXQrs1KpVK/n7+8vV1bXOxyCwAABMr7KyUtnZ2XJxcVFAQIBcXV35otBGwDAMlZWV6ZtvvlF2dra6d+9+zS+IqwmBBQBgemVlZaqsrFRgYKBatWrV0OXADi1btlSLFi305ZdfqqysTO7u7nU6DjfdAgAajbr+3zkaliN+bvzkAQCA6RFYAACA6dkVWBITEzVo0CC1bdtWPj4+mjhxoo4dO2bTp6SkRDExMerQoYPatGmjSZMmKS8vr9bjGoah+fPny9/fXy1bttSYMWN04sQJ+88GAAA0SXYFlh07digmJkZ79+5VSkqKysvLdffdd6u4uNja5/HHH9f/+3//T++++6527Nihr776Svfdd1+tx33hhRf08ssv69VXX9W+ffvUunVrRUZGqqSkpG5nBQCAieTm5up3v/udgoKC5ObmpsDAQI0fP16pqakNXVoVSUlJ8vLyaugyqrDrKaHk5GSb9aSkJPn4+CgjI0MjRoxQQUGB3njjDb311lu66667JElr1qxRr169tHfvXt1xxx1VjmkYhpYtW6ann35aEyZMkCS9+eab8vX11aZNm/Tggw/W9dwAAGhwp0+f1rBhw+Tl5aUXX3xRffr0UXl5uT788EPFxMTo6NGjdh+zrKys2u80KS8vV4sWLRxRtunc0D0sBQUFkqT27dtLkjIyMlReXq4xY8ZY+/Ts2VMdO3ZUenp6tcfIzs5Wbm6uzT6enp4aMmRIjfuUlpaqsLDQZgEA3FwMQyourv/FMOyr89FHH5XFYtH+/fs1adIkBQcHq3fv3oqNjdXevXslSTk5OZowYYLatGkjDw8PPfDAAza3U8THx6tfv356/fXX1aVLF+ujwRaLRatWrdI999yj1q1b69lnn5Ukbd68Wf3795e7u7uCgoK0cOFCXb582Xq8/Px8PfLII/L19ZW7u7tCQ0O1ZcsWpaWlacaMGSooKJDFYpHFYlF8fPyN/aAcpM7fw1JZWanHHntMw4YNU2hoqKQrU16urq5VppJ8fX2Vm5tb7XGutvv6+l73PomJiVq4cGFdSweA67c9seZto+Lqr456sjTleLXtj48NrudKru3SJalNm/r/3KIiqXXr6+v77bffKjk5Wc8++6xaV7OTl5eXKisrrWFlx44dunz5smJiYjR58mSlpaVZ+548eVIbNmzQxo0b5eLiYm2Pj4/X888/r2XLlql58+b6+OOPFR0drZdffll33nmnsrKyNGvWLEnSggULVFlZqaioKF28eFHr1q1T165ddfjwYbm4uGjo0KFatmyZ5s+fb71HtU1DDHI16hxYYmJidOjQIe3atcuR9VyXuLg4xcbGWtcLCwsVGBhY73UAAFCbkydPyjAM9ezZs8Y+qampOnjwoLKzs61/y95880317t1bn3zyiQYNGiTpymWgN998U97e3jb7/+IXv9CMGTOs6w899JCefPJJTZs2TZIUFBSkRYsWad68eVqwYIG2bdum/fv368iRIwoODrb2ucrT01MWi0V+fn6OGQQHqVNgmT17trZs2aKdO3fqtttus7b7+fmprKxM+fn5NrMseXl5NZ741fa8vDz5+/vb7NOvX79q93Fzc5Obm1tdSgcANBGtWl2Z7WiIz71exnVcPzpy5IgCAwNt/sc7JCREXl5eOnLkiDWwdOrUqUpYkaSBAwfarH/22WfavXu39fKQJFVUVKikpESXLl1SZmambrvtNmtYaSzsCiyGYeh3v/ud3nvvPaWlpalLly422wcMGKAWLVooNTVVkyZNkiQdO3ZMOTk5Cg8Pr/aYXbp0kZ+fn1JTU60BpbCwUPv27dNvf/vbOpwSAOBmYLFc/6WZhtK9e3dZLJY63Vj7Y9VdUqquvaioSAsXLqz2CV13d3e1bNnyhmtpCHbddBsTE6N169bprbfeUtu2bZWbm6vc3Fz997//lXRlGunhhx9WbGystm/froyMDM2YMUPh4eE2Twj17NlT7733nqQrNww99thjWrx4sd5//30dPHhQ0dHRCggI0MSJEx13pgAA1LP27dsrMjJSK1eutPkKkKvy8/PVq1cvnTlzRmfOnLG2Hz58WPn5+QoJCbH7M/v3769jx46pW7duVZZmzZopLCxMZ8+e1fHj1d+v5OrqqoqKCrs/19nsmmFZtWqVJCkiIsKmfc2aNZo+fbokaenSpWrWrJkmTZqk0tJSRUZG6pVXXrHpf+zYMesTRpI0b948FRcXa9asWcrPz9fw4cOVnJxc5xckAQBgFitXrtSwYcM0ePBgJSQkKCwsTJcvX1ZKSopWrVqlw4cPq0+fPpo6daqWLVumy5cv69FHH9XIkSOrXO65HvPnz9fPfvYzdezYUT//+c/VrFkzffbZZzp06JAWL16skSNHasSIEZo0aZKWLFmibt266ejRo7JYLBo3bpw6d+6soqIipaamqm/fvmrVqpUpXjhp1wyLYRjVLlfDinRlumnlypX69ttvVVxcrI0bN1a5f+XH+1gsFiUkJCg3N1clJSXatm1bo7u2BgBAdYKCgnTgwAGNGjVKc+bMUWhoqMaOHavU1FStWrVKFotFmzdvVrt27TRixAiNGTNGQUFBevvtt+v0eZGRkdqyZYs++ugjDRo0SHfccYeWLl2qTp06Wfts2LBBgwYN0pQpUxQSEqJ58+ZZZ1WGDh2q3/zmN5o8ebK8vb31wgsvOGQcbpTFuJ47gkyusLBQnp6eKigokIeHR0OXA8CRiou/f3bVnudJHaURPtZ8I0Nm1seaS0pKlJ2dbfMdJGg8avr52fP3m5cfAgAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAADgRNOnT2+yL/ONiIjQY489Vi+fRWABAKAJKysrq9JWUVGhysrKBqim7ggsAADUk4iICP3+97/XvHnz1L59e/n5+Sk+Pt6mT35+vh555BH5+vrK3d1doaGh2rJli3X7hg0b1Lt3b7m5ualz58566aWXbPbv3LmzFi1apOjoaHl4eGjWrFlKSkqSl5eX3n//fYWEhMjNzU05OTkqLS3V3Llzdeutt6p169YaMmSI0tLSbI63e/duRUREqFWrVmrXrp0iIyP13Xffafr06dqxY4eWL18ui8Uii8Wi06dPO2nkpOZOOzIAAM5kGNKlS/X/ua1aSRZLnXdfu3atYmNjtW/fPqWnp2v69OkaNmyYxo4dq8rKSkVFRenixYtat26dunbtqsOHD8vFxUWSlJGRoQceeEDx8fGaPHmy9uzZo0cffVQdOnTQ9OnTrZ/xl7/8RfPnz9eCBQskSR9//LEuXbqkP//5z3r99dfVoUMH+fj4aPbs2Tp8+LDWr1+vgIAAvffeexo3bpwOHjyo7t27KzMzU6NHj9ZDDz2k5cuXq3nz5tq+fbsqKiq0fPlyHT9+XKGhoUpISJAkeXt7131cr4HAAgBonC5d+v611PXpBt8aHhYWZg0S3bt314oVK5SamqqxY8dq27Zt2r9/v44cOaLg4CtvyA4KCrLuu2TJEo0ePVrPPPOMJCk4OFiHDx/Wiy++aBNY7rrrLs2ZM8e6/vHHH6u8vFyvvPKK+vbtK0nKycnRmjVrlJOTo4CAAEnS3LlzlZycrDVr1ui5557TCy+8oIEDB+qVV16xHqt3797Wf7u6uqpVq1by8/Or83hcLy4JAQBQj8LCwmzW/f399fXXX0uSMjMzddttt1nDyo8dOXJEw4YNs2kbNmyYTpw4oYqKCmvbwIEDq+zr6upq89kHDx5URUWFgoOD1aZNG+uyY8cOZWVlWesZPXp03U7UwZhhAQA0Tq1aXZntaIjPvQEtWrSwWbdYLNYbYFu2bHlDx76qdTUzQC1btpTlB5eyioqK5OLiooyMDOslp6va/N/MlaPqcQQCCwCgcbJYbujSjBmFhYXp7NmzOn78eLWzLL169dLu3btt2nbv3q3g4OAqoeNabr/9dlVUVOjrr7/WnXfeWWM9qampWrhwYbXbXV1dbWZ2nIlLQgAAmMTIkSM1YsQITZo0SSkpKcrOztY///lPJScnS5LmzJmj1NRULVq0SMePH9fatWu1YsUKzZ071+7PCg4O1tSpUxUdHa2NGzcqOztb+/fvV2Jioj744ANJUlxcnD755BM9+uij+vzzz3X06FGtWrVK58+fl3TliaR9+/bp9OnTOn/+vFMflSawAABgIhs2bNCgQYM0ZcoUhYSEaN68edZZjP79++udd97R+vXrFRoaqvnz5yshIcHmhlt7rFmzRtHR0ZozZ4569OihiRMn6pNPPlHHjh0lXQk1H330kT777DMNHjxY4eHh2rx5s5o3v3KBZu7cuXJxcVFISIi8vb2Vk5PjkDGojsUwDMNpR68nhYWF8vT0VEFBgTw8PBq6HACOVFz8/ZMgN/h0Rp1sT6x526i4+qvDDjcyZEtTjlfb/vjY6m8CrS8lJSXKzs5Wly5d5O7u3qC1wH41/fzs+fvNDAsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA93tYMAGjUanqdgDPU9RUFubm5evbZZ/XBBx/oP//5j3x8fNSvXz899thjGj16tIOrvDFJSUl67LHHlJ+f39Cl2CCwAADgRKdPn9awYcPk5eWlF198UX369FF5ebk+/PBDxcTE6OjRo3Yfs6ysTK6urlXay8vL1aJFC0eUbTp2XxLauXOnxo8fr4CAAFksFm3atMlmu8ViqXZ58cUXazxmfHx8lf49e/a0+2QAADCbRx99VBaLRfv379ekSZMUHBys3r17KzY2Vnv37pUk5eTkaMKECWrTpo08PDz0wAMPKC8vz3qM+Ph49evXT6+//rrNCwQtFotWrVqle+65R61bt9azzz4rSdq8ebP69+8vd3d3BQUFaeHChbp8+bL1ePn5+XrkkUfk6+srd3d3hYaGasuWLUpLS9OMGTNUUFBg/XscHx9ff4NVC7tnWIqLi9W3b1899NBDuu+++6psP3funM36P//5Tz388MOaNGlSrcft3bu3tm3b9n1hzZn8AQA0bt9++62Sk5P17LPPqnU1r8328vJSZWWlNazs2LFDly9fVkxMjCZPnqy0tDRr35MnT2rDhg3auHGjXFxcrO3x8fF6/vnntWzZMjVv3lwff/yxoqOj9fLLL+vOO+9UVlaWZs2aJUlasGCBKisrFRUVpYsXL2rdunXq2rWrDh8+LBcXFw0dOlTLli3T/PnzdezYMUlSm6uv/m5gdqeCqKgoRUVF1bjdz8/PZn3z5s0aNWqUgoKCai+kefMq+wIA0JidPHlShmHUetUgNTVVBw8eVHZ2tgIDAyVJb775pnr37q1PPvlEgwYNknTlMtCbb74pb29vm/1/8YtfaMaMGdb1hx56SE8++aSmTZsmSQoKCtKiRYs0b948LViwQNu2bdP+/ft15MgRBQcHW/tc5enpKYvFYrq/yU6dxsjLy9MHH3ygtWvXXrPviRMnFBAQIHd3d4WHhysxMVEdO3astm9paalKS0ut64WFhQ6rGQAARzEM45p9jhw5osDAQGtYkaSQkBB5eXnpyJEj1sDSqVOnKmFFkgYOHGiz/tlnn2n37t3Wy0OSVFFRoZKSEl26dEmZmZm67bbbrGGlsXBqYFm7dq3atm1b7aWjHxoyZIiSkpLUo0cPnTt3TgsXLtSdd96pQ4cOqW3btlX6JyYmauHChc4qGwAAh+jevbssFkudbqz9seouKVXXXlRUpIULF1b7t9fd3V0tW7a84VoaglO/h2X16tWaOnWq9eagmkRFRen+++9XWFiYIiMjtXXrVuXn5+udd96ptn9cXJwKCgqsy5kzZ5xRPgAAN6R9+/aKjIzUypUrVVxcXGV7fn6+evXqpTNnztj8LTt8+LDy8/MVEhJi92f2799fx44dU7du3aoszZo1U1hYmM6ePavjx6t/HNzV1VUVFRV2f66zOW2G5eOPP9axY8f09ttv272vl5eXgoODdfLkyWq3u7m5yc3N7UZLBADA6VauXKlhw4Zp8ODBSkhIUFhYmC5fvqyUlBStWrVKhw8fVp8+fTR16lQtW7ZMly9f1qOPPqqRI0dWudxzPebPn6+f/exn6tixo37+85+rWbNm+uyzz3To0CEtXrxYI0eO1IgRIzRp0iQtWbJE3bp109GjR2WxWDRu3Dh17txZRUVFSk1NVd++fdWqVSu1atXKCSNjH6fNsLzxxhsaMGCA+vbta/e+RUVFysrKkr+/vxMqAwCg/gQFBenAgQMaNWqU5syZo9DQUI0dO1apqalatWqVLBaLNm/erHbt2mnEiBEaM2aMgoKC6vQ//JIUGRmpLVu26KOPPtKgQYN0xx13aOnSperUqZO1z4YNGzRo0CBNmTJFISEhmjdvnnVWZejQofrNb36jyZMny9vbWy+88IJDxuFGWYzruSPoB4qKiqwzH7fffruWLFmiUaNGqX379tabZAsLC+Xv76+XXnpJv/nNb6ocY/To0br33ns1e/ZsSdLcuXM1fvx4derUSV999ZUWLFigzMxMHT58uNobjH6ssLBQnp6eKigokIeHhz2nA8Dsioulq49VFhVJNVzHd5rtiTVvGxVXf3XY4UaGrKZvja3rN7w6SklJibKzs22+gwSNR00/P3v+ftt9SejTTz/VqFGjrOuxsbGSpGnTpikpKUmStH79ehmGoSlTplR7jKysLJ0/f966fvbsWU2ZMkUXLlyQt7e3hg8frr17915XWAEAAE2f3YElIiLimo9pzZo1y/olNdU5ffq0zfr69evtLQMAANxEeFszAAAwPQILAAAwPV7YA6BhOONm1kZ4gyyA68MMCwAAMD0CCwAAMD0CCwAAMD0CCwAAMD0CCwAAMD2eEgIANG61PR3maHV42mz69OnKz8/Xpk2bHF9PA4uIiFC/fv20bNkyp38WMywAADRhZWVlVdoqKipUWVnZANXUHYEFAIB6EhERod///veaN2+e2rdvLz8/P8XHx9v0yc/P1yOPPCJfX1+5u7srNDRUW7ZssW7fsGGDevfuLTc3N3Xu3FkvvfSSzf6dO3fWokWLFB0dLQ8PD82aNUtJSUny8vLS+++/r5CQELm5uSknJ0elpaWaO3eubr31VrVu3VpDhgxRWlqazfF2796tiIgItWrVSu3atVNkZKS+++47TZ8+XTt27NDy5ctlsVhksViqvHrHkQgsAADUo7Vr16p169bat2+fXnjhBSUkJCglJUWSVFlZqaioKO3evVvr1q3T4cOH9fzzz8vFxUWSlJGRoQceeEAPPvigDh48qPj4eD3zzDPWlw9f9Ze//EV9+/bVv//9bz3zzDOSpEuXLunPf/6zXn/9dX3xxRfy8fHR7NmzlZ6ervXr1+vzzz/X/fffr3HjxunEiROSpMzMTI0ePVohISFKT0/Xrl27NH78eFVUVGj58uUKDw/XzJkzde7cOZ07d06BgYFOGzfuYQEAoB6FhYVpwYIFkqTu3btrxYoVSk1N1dixY7Vt2zbt379fR44cUXBwsCQpKCjIuu+SJUs0evRoawgJDg7W4cOH9eKLL2r69OnWfnfddZfmzJljXf/4449VXl6uV155RX379pUk5eTkaM2aNcrJyVFAQIAkae7cuUpOTtaaNWv03HPP6YUXXtDAgQP1yiuvWI/Vu3dv679dXV3VqlUr+fn5OXiUqmKGBQCAehQWFmaz7u/vr6+//lrSlRmN2267zRpWfuzIkSMaNmyYTduwYcN04sQJVVRUWNsGDhxYZV9XV1ebzz548KAqKioUHBysNm3aWJcdO3YoKyvLWs/o0aPrdqIOxgwLAAD1qEWLFjbrFovFegNsy5YtHfIZrVu3rtLWsmVLWSwW63pRUZFcXFyUkZFhveR0VZs2bRxajyMwwwIAgEmEhYXp7NmzOn78eLXbe/Xqpd27d9u07d69W8HBwVVCx7Xcfvvtqqio0Ndff61u3brZLFcv8YSFhSk1NbXGY7i6utrM7DgTgQUAAJMYOXKkRowYoUmTJiklJUXZ2dn65z//qeTkZEnSnDlzlJqaqkWLFun48eNau3atVqxYoblz59r9WcHBwZo6daqio6O1ceNGZWdna//+/UpMTNQHH3wgSYqLi9Mnn3yiRx99VJ9//rmOHj2qVatW6fz585KuPJG0b98+nT59WufPn3fqo9IEFgAATGTDhg0aNGiQpkyZopCQEM2bN886i9G/f3+98847Wr9+vUJDQzV//nwlJCTY3HBrjzVr1ig6Olpz5sxRjx49NHHiRH3yySfq2LGjpCuh5qOPPtJnn32mwYMHKzw8XJs3b1bz5lfuKJk7d65cXFwUEhIib29v5eTkOGQMqmMxDMNw2tHrSWFhoTw9PVVQUCAPD4+GLgfA9ajt20l/+G2ixcXS/11PV1GRVM21ebuPaQ9nHNPJ7BmyH1uaUv2liMfHVn8TaH0pKSlRdna2unTpInd39watBfar6ednz99vZlgAAIDpEVgAAIDpEVgAAIDpEVgAAIDpEVgAAIDpEVgAAI1GE3iw9abkiJ8bgQUAYHpXv87+0qVLDVwJ6uLqz+3HryWwB+8SAgCYnouLi7y8vKwvCWzVqpXNe3FgToZh6NKlS/r666/l5eVl9+sDfojAAgBoFK6+3+ZqaEHj4eXlZf351RWBBQDQKFgsFvn7+8vHx0fl5eUNXQ6uU4sWLW5oZuUqAgsAoFFxcXFxyB9ANC7cdAsAAEyPwAIAAEyPwAIAAEzP7sCyc+dOjR8/XgEBAbJYLNq0aZPN9unTp8tisdgs48aNu+ZxV65cqc6dO8vd3V1DhgzR/v377S0NAAA0UXYHluLiYvXt21crV66ssc+4ceN07tw56/KPf/yj1mO+/fbbio2N1YIFC3TgwAH17dtXkZGRPLoGAAAk1eEpoaioKEVFRdXax83Nza7nrZcsWaKZM2dqxowZkqRXX31VH3zwgVavXq0nn3zS3hIBAEAT45R7WNLS0uTj46MePXrot7/9rS5cuFBj37KyMmVkZGjMmDHfF9WsmcaMGaP09PRq9yktLVVhYaHNAgAAmi6Hfw/LuHHjdN9996lLly7KysrSU089paioKKWnp1f73Pz58+dVUVEhX19fm3ZfX18dPXq02s9ITEzUwoULHV06cPPanljztlFx9VdHQ6nt/AGYgsMDy4MPPmj9d58+fRQWFqauXbsqLS1No0ePdshnxMXFKTY21rpeWFiowMBAhxwbAACYj9Mfaw4KCtItt9yikydPVrv9lltukYuLi/Ly8mza8/LyarwPxs3NTR4eHjYLAABoupweWM6ePasLFy7I39+/2u2urq4aMGCAUlNTrW2VlZVKTU1VeHi4s8sDAACNgN2BpaioSJmZmcrMzJQkZWdnKzMzUzk5OSoqKtITTzyhvXv36vTp00pNTdWECRPUrVs3RUZGWo8xevRorVixwroeGxurv/3tb1q7dq2OHDmi3/72tyouLrY+NQQAAG5udt/D8umnn2rUqFHW9av3kkybNk2rVq3S559/rrVr1yo/P18BAQG6++67tWjRIrm5uVn3ycrK0vnz563rkydP1jfffKP58+crNzdX/fr1U3JycpUbcQEAwM3J7sASEREhwzBq3P7hhx9e8xinT5+u0jZ79mzNnj3b3nIAAMBNgHcJAQAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA07P7XUIAgJvP0pTj19338bHBTqwENytmWAAAgOkRWAAAgOkRWAAAgOkRWAAAgOkRWAAAgOkRWAAAgOkRWAAAgOkRWAAAgOkRWAAAgOkRWAAAgOkRWAAAgOkRWAAAgOkRWAAAgOkRWAAAgOkRWAAAgOkRWAAAgOk1b+gCAKCK7Ynf//u/Zd//e8dfpJ8sqP96nOGH5/hjo+Lqrw6gkWCGBQAAmB6BBQAAmB6BBQAAmB6BBQAAmJ7dgWXnzp0aP368AgICZLFYtGnTJuu28vJy/fGPf1SfPn3UunVrBQQEKDo6Wl999VWtx4yPj5fFYrFZevbsaffJAACApsnuwFJcXKy+fftq5cqVVbZdunRJBw4c0DPPPKMDBw5o48aNOnbsmO65555rHrd37946d+6cddm1a5e9pQEAgCbK7seao6KiFBUVVe02T09PpaSk2LStWLFCgwcPVk5Ojjp27FhzIc2by8/Pz95yAADATcDp97AUFBTIYrHIy8ur1n4nTpxQQECAgoKCNHXqVOXk5NTYt7S0VIWFhTYLAABoupwaWEpKSvTHP/5RU6ZMkYeHR439hgwZoqSkJCUnJ2vVqlXKzs7WnXfeqYsXL1bbPzExUZ6entYlMDDQWacAAABMwGmBpby8XA888IAMw9CqVatq7RsVFaX7779fYWFhioyM1NatW5Wfn6933nmn2v5xcXEqKCiwLmfOnHHGKQAAAJNwylfzXw0rX375pf71r3/VOrtSHS8vLwUHB+vkyZPVbndzc5Obm5sjSgUAAI2Aw2dYroaVEydOaNu2berQoYPdxygqKlJWVpb8/f0dXR4AAGiE7A4sRUVFyszMVGZmpiQpOztbmZmZysnJUXl5uX7+85/r008/1d///ndVVFQoNzdXubm5Kiv7/gVmo0eP1ooVK6zrc+fO1Y4dO3T69Gnt2bNH9957r1xcXDRlypQbP0MAANDo2X1J6NNPP9WoUaOs67GxsZKkadOmKT4+Xu+//74kqV+/fjb7bd++XREREZKkrKwsnT9/3rrt7NmzmjJlii5cuCBvb28NHz5ce/fulbe3t73lAQCAJsjuwBIRESHDMGrcXtu2q06fPm2zvn79envLAAAANxHeJQQAAEyPwAIAAEzPKY81AwBuzNKU49W2Pz42+Jr9S/9rkdTdGWXdkJrOqSbXc67X0x9NAzMsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9Jo3dAEATG57Ys3bRsXVXx1X1VaPM/Zz8jHTT12o0rb38vEa+y9NqXnbHTmvSZL+W+oq6TlJ0r61T6mlW5n2dpx1Y4UCDYwZFgAAYHoEFgAAYHoEFgAAYHoEFgAAYHoEFgAAYHoEFgAAYHoEFgAAYHoEFgAAYHoEFgAAYHoEFgAAYHoEFgAAYHoEFgAAYHp2B5adO3dq/PjxCggIkMVi0aZNm2y2G4ah+fPny9/fXy1bttSYMWN04sSJax535cqV6ty5s9zd3TVkyBDt37/f3tIAAEATZXdgKS4uVt++fbVy5cpqt7/wwgt6+eWX9eqrr2rfvn1q3bq1IiMjVVJSUuMx3377bcXGxmrBggU6cOCA+vbtq8jISH399df2lgcAAJoguwNLVFSUFi9erHvvvbfKNsMwtGzZMj399NOaMGGCwsLC9Oabb+qrr76qMhPzQ0uWLNHMmTM1Y8YMhYSE6NVXX1WrVq20evVqe8sDAABNkEPvYcnOzlZubq7GjBljbfP09NSQIUOUnp5e7T5lZWXKyMiw2adZs2YaM2ZMjfuUlpaqsLDQZgEAAE2XQwNLbm6uJMnX19em3dfX17rtx86fP6+Kigq79klMTJSnp6d1CQwMdED1AADArBrlU0JxcXEqKCiwLmfOnGnokgAAgBM5NLD4+flJkvLy8mza8/LyrNt+7JZbbpGLi4td+7i5ucnDw8NmAQAATZdDA0uXLl3k5+en1NRUa1thYaH27dun8PDwavdxdXXVgAEDbPaprKxUampqjfsAAICbS3N7dygqKtLJkyet69nZ2crMzFT79u3VsWNHPfbYY1q8eLG6d++uLl266JlnnlFAQIAmTpxo3Wf06NG69957NXv2bElSbGyspk2bpoEDB2rw4MFatmyZiouLNWPGjBs/QwAA0OjZHVg+/fRTjRo1yroeGxsrSZo2bZqSkpI0b948FRcXa9asWcrPz9fw4cOVnJwsd3d36z5ZWVk6f/68dX3y5Mn65ptvNH/+fOXm5qpfv35KTk6uciMuAAC4OdkdWCIiImQYRo3bLRaLEhISlJCQUGOf06dPV2mbPXu2dcYFAADghxrlU0IAAODmQmABAACmR2ABAACmR2ABAACmR2ABAACmR2ABAACmR2ABAACmR2ABAACmR2ABAACmR2ABAACmR2ABAACmZ/e7hACgIaWfulClLTyoQwNU0jDuyHmtoUu4pqUpxxu6BDRBzLAAAADTI7AAAADTI7AAAADTI7AAAADTI7AAAADTI7AAAADTI7AAAADTI7AAAADTI7AAAADTI7AAAADTI7AAAADTI7AAAADTI7AAAADTI7AAAADTI7AAAADTI7AAAADTa97QBQBAU5N+6kK17eFBHeq5ksZtacrxhi4BJsIMCwAAMD0CCwAAMD0CCwAAMD0CCwAAMD2HB5bOnTvLYrFUWWJiYqrtn5SUVKWvu7u7o8sCAACNmMOfEvrkk09UUVFhXT906JDGjh2r+++/v8Z9PDw8dOzYMeu6xWJxdFkAAKARc3hg8fb2tll//vnn1bVrV40cObLGfSwWi/z8/BxdCgAAaCKceg9LWVmZ1q1bp4ceeqjWWZOioiJ16tRJgYGBmjBhgr744otaj1taWqrCwkKbBQAANF1ODSybNm1Sfn6+pk+fXmOfHj16aPXq1dq8ebPWrVunyspKDR06VGfPnq1xn8TERHl6elqXwMBAJ1QPAADMwqmB5Y033lBUVJQCAgJq7BMeHq7o6Gj169dPI0eO1MaNG+Xt7a2//vWvNe4TFxengoIC63LmzBlnlA8AAEzCaV/N/+WXX2rbtm3auHGjXfu1aNFCt99+u06ePFljHzc3N7m5ud1oiQAAoJFw2gzLmjVr5OPjo5/+9Kd27VdRUaGDBw/K39/fSZUBAIDGximBpbKyUmvWrNG0adPUvLntJE50dLTi4uKs6wkJCfroo4906tQpHThwQL/85S/15Zdf6te//rUzSgMAAI2QUy4Jbdu2TTk5OXrooYeqbMvJyVGzZt/npO+++04zZ85Ubm6u2rVrpwEDBmjPnj0KCQlxRmkAAKARckpgufvuu2UYRrXb0tLSbNaXLl2qpUuXOqMMAADQRPAuIQAAYHoEFgAAYHpOe6wZABpa+qkL1baHB3Wo50quqKmeH7sj5zUnVwI0PsywAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA0yOwAAAA02ve0AUA9WZ7Ys3bRsXVXx03i9rGu5FJP3Wh2vbwoA71XAlw82KGBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmJ7DA0t8fLwsFovN0rNnz1r3effdd9WzZ0+5u7urT58+2rp1q6PLAgAAjZhTZlh69+6tc+fOWZddu3bV2HfPnj2aMmWKHn74Yf373//WxIkTNXHiRB06dMgZpQEAgEbIKYGlefPm8vPzsy633HJLjX2XL1+ucePG6YknnlCvXr20aNEi9e/fXytWrHBGaQAAoBFySmA5ceKEAgICFBQUpKlTpyonJ6fGvunp6RozZoxNW2RkpNLT02vcp7S0VIWFhTYLAABoupo7+oBDhgxRUlKSevTooXPnzmnhwoW68847dejQIbVt27ZK/9zcXPn6+tq0+fr6Kjc3t8bPSExM1MKFCx1dOmAe2xNr3jYqrv7quJba6myE0k9daOgS4ARLU45fd9/HxwY7sRLcCIfPsERFRen+++9XWFiYIiMjtXXrVuXn5+udd95x2GfExcWpoKDAupw5c8ZhxwYAAObj8BmWH/Py8lJwcLBOnjxZ7XY/Pz/l5eXZtOXl5cnPz6/GY7q5ucnNzc2hdQIAAPNy+vewFBUVKSsrS/7+/tVuDw8PV2pqqk1bSkqKwsPDnV0aAABoJBweWObOnasdO3bo9OnT2rNnj+699165uLhoypQpkqTo6GjFxX1/Df4Pf/iDkpOT9dJLL+no0aOKj4/Xp59+qtmzZzu6NAAA0Eg5/JLQ2bNnNWXKFF24cEHe3t4aPny49u7dK29vb0lSTk6OmjX7PicNHTpUb731lp5++mk99dRT6t69uzZt2qTQ0FBHlwYAABophweW9evX17o9LS2tStv999+v+++/39GlAACAJoJ3CQEAANMjsAAAANMjsAAAANMjsAAAANMjsAAAANMjsAAAANMjsAAAANMjsAAAANMjsAAAANMjsAAAANMjsAAAANNz+LuEgCZne2LN20bF1bzNWeyoZ2nK8SpdHh8b7OiKbkj6qQu1bm9WWq4h//fvfae/ldxaOL8oNErV/b6j6WCGBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmF7zhi4AgANtT7RZvSPnQjV9OtRTMfUn/VQ15wkbd+S8Vqf99nac5eBKgLphhgUAAJgegQUAAJgegQUAAJgegQUAAJiewwNLYmKiBg0apLZt28rHx0cTJ07UsWPHat0nKSlJFovFZnF3d3d0aQAAoJFyeGDZsWOHYmJitHfvXqWkpKi8vFx33323iouLa93Pw8ND586dsy5ffvmlo0sDAACNlMMfa05OTrZZT0pKko+PjzIyMjRixIga97NYLPLz83N0OQAAoAlw+j0sBQUFkqT27dvX2q+oqEidOnVSYGCgJkyYoC+++KLGvqWlpSosLLRZAABA0+XUwFJZWanHHntMw4YNU2hoaI39evToodWrV2vz5s1at26dKisrNXToUJ09e7ba/omJifL09LQugYGBzjoFAABgAk4NLDExMTp06JDWr19fa7/w8HBFR0erX79+GjlypDZu3Chvb2/99a9/rbZ/XFycCgoKrMuZM2ecUT4AADAJp301/+zZs7Vlyxbt3LlTt912m137tmjRQrfffrtOnjxZ7XY3Nze5ubk5okwAANAIOHyGxTAMzZ49W++9957+9a9/qUuXLnYfo6KiQgcPHpS/v7+jywMAAI2Qw2dYYmJi9NZbb2nz5s1q27atcnNzJUmenp5q2bKlJCk6Olq33nqrEhOvvKgtISFBd9xxh7p166b8/Hy9+OKL+vLLL/XrX//a0eUBAIBGyOGBZdWqVZKkiIgIm/Y1a9Zo+vTpkqScnBw1a/b95M53332nmTNnKjc3V+3atdOAAQO0Z88ehYSEOLo8AADQCDk8sBiGcc0+aWlpNutLly7V0qVLHV0KAABoIniXEAAAMD0CCwAAMD2nPdYMSdsTa942Kq7+6rhRtZ1HbW7kHOs6dnWtta4aYmycJP3UhWrbw4M6OOQ4ZuKoGhvDuTrTHTmv1bp9b8dZ9VSJ4yxNOV5t++Njgx3SH3XHDAsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADA9AgsAADC95g1dQKOwPbHmbaPiHH/Ma6nrZ9bmRuqpz2M6i8lqTT91wa7+4UEdnHZs3NzuyHnNVJ+5t+OseqzE8ZamHK+2/fGxwfVcSc3MWiMzLAAAwPQILAAAwPQILAAAwPQILAAAwPQILAAAwPQILAAAwPQILAAAwPQILAAAwPQILAAAwPQILAAAwPQILAAAwPQILAAAwPScFlhWrlypzp07y93dXUOGDNH+/ftr7f/uu++qZ8+ecnd3V58+fbR161ZnlQYAABoZpwSWt99+W7GxsVqwYIEOHDigvn37KjIyUl9//XW1/ffs2aMpU6bo4Ycf1r///W9NnDhREydO1KFDh5xRHgAAaGScEliWLFmimTNnasaMGQoJCdGrr76qVq1aafXq1dX2X758ucaNG6cnnnhCvXr10qJFi9S/f3+tWLHCGeUBAIBGprmjD1hWVqaMjAzFxcVZ25o1a6YxY8YoPT292n3S09MVGxtr0xYZGalNmzZV27+0tFSlpaXW9YKCAklSYWHhDVZfg+KSmrfV9pm17XcjnHGezqrVGRpizB3tGj/D4v+W1rq9yuFqOG97j2PPsWviiM/8oWal5bo6WsX/LVVlZaVDj98U/bfUkP5v1K6MWVmD1FFSXFSn/Wr7HarrMW9UTX9faqrHUf0bQn3WePWYhmFcu7PhYP/5z38MScaePXts2p944glj8ODB1e7TokUL46233rJpW7lypeHj41Nt/wULFhiSWFhYWFhYWJrAcubMmWvmC4fPsNSHuLg4mxmZyspKffvtt+rQoYMsFovTP7+wsFCBgYE6c+aMPDw8nP55TRlj6TiMpWMwjo7DWDpOUx1LwzB08eJFBQQEXLOvwwPLLbfcIhcXF+Xl5dm05+Xlyc/Pr9p9/Pz87Orv5uYmNzc3mzYvL6+6F11HHh4eTeoXpyExlo7DWDoG4+g4jKXjNMWx9PT0vK5+Dr/p1tXVVQMGDFBqaqq1rbKyUqmpqQoPD692n/DwcJv+kpSSklJjfwAAcHNxyiWh2NhYTZs2TQMHDtTgwYO1bNkyFRcXa8aMGZKk6Oho3XrrrUpMTJQk/eEPf9DIkSP10ksv6ac//anWr1+vTz/9VK+99pozygMAAI2MUwLL5MmT9c0332j+/PnKzc1Vv379lJycLF9fX0lSTk6OmjX7fnJn6NCheuutt/T000/rqaeeUvfu3bVp0yaFhoY6o7wb5ubmpgULFlS5LAX7MZaOw1g6BuPoOIyl4zCWksUwrudZIgAAgIbDu4QAAIDpEVgAAIDpEVgAAIDpEVgAAIDpEVhqsHLlSnXu3Fnu7u4aMmSI9u/ff137rV+/XhaLRRMnTnRugY2IPWOZlJQki8Vis7i7u9djteZm7+9lfn6+YmJi5O/vLzc3NwUHB2vr1q31VK152TOOERERVX4nLRaLfvrTn9ZjxeZl7+/ksmXL1KNHD7Vs2VKBgYF6/PHHVVLSSN4B5mT2jGV5ebkSEhLUtWtXubu7q2/fvkpOTq7HahvA9bwf6Gazfv16w9XV1Vi9erXxxRdfGDNnzjS8vLyMvLy8WvfLzs42br31VuPOO+80JkyYUD/Fmpy9Y7lmzRrDw8PDOHfunHXJzc2t56rNyd6xLC0tNQYOHGj85Cc/MXbt2mVkZ2cbaWlpRmZmZj1Xbi72juOFCxdsfh8PHTpkuLi4GGvWrKnfwk3I3rH8+9//bri5uRl///vfjezsbOPDDz80/P39jccff7yeKzcfe8dy3rx5RkBAgPHBBx8YWVlZxiuvvGK4u7sbBw4cqOfK6w+BpRqDBw82YmJirOsVFRVGQECAkZiYWOM+ly9fNoYOHWq8/vrrxrRp0wgs/8fesVyzZo3h6elZT9U1LvaO5apVq4ygoCCjrKysvkpsFOry3/cPLV261Gjbtq1RVFTkrBIbDXvHMiYmxrjrrrts2mJjY41hw4Y5tc7GwN6x9Pf3N1asWGHTdt999xlTp051ap0NiUtCP1JWVqaMjAyNGTPG2tasWTONGTNG6enpNe6XkJAgHx8fPfzww/VRZqNQ17EsKipSp06dFBgYqAkTJuiLL76oj3JNrS5j+f777ys8PFwxMTHy9fVVaGionnvuOVVUVNRX2aZT19/JH3rjjTf04IMPqnXr1s4qs1Goy1gOHTpUGRkZ1ksdp06d0tatW/WTn/ykXmo2q7qMZWlpaZXL5S1bttSuXbucWmtDIrD8yPnz51VRUWH9Vt6rfH19lZubW+0+u3bt0htvvKG//e1v9VFio1GXsezRo4dWr16tzZs3a926daqsrNTQoUN19uzZ+ijZtOoylqdOndL//u//qqKiQlu3btUzzzyjl156SYsXL66Pkk2pLuP4Q/v379ehQ4f061//2lklNhp1Gctf/OIXSkhI0PDhw9WiRQt17dpVEREReuqpp+qjZNOqy1hGRkZqyZIlOnHihCorK5WSkqKNGzfq3Llz9VFygyCw3KCLFy/qV7/6lf72t7/plltuaehyGr3w8HBFR0erX79+GjlypDZu3Chvb2/99a9/bejSGp3Kykr5+Pjotdde04ABAzR58mT96U9/0quvvtrQpTVab7zxhvr06aPBgwc3dCmNUlpamp577jm98sorOnDggDZu3KgPPvhAixYtaujSGp3ly5ere/fu6tmzp1xdXTV79mzNmDHD5rU3TY1T3iXUmN1yyy1ycXFRXl6eTXteXp78/Pyq9M/KytLp06c1fvx4a1tlZaUkqXnz5jp27Ji6du3q3KJNyt6xrE6LFi10++236+TJk84osdGoy1j6+/urRYsWcnFxsbb16tVLubm5Kisrk6urq1NrNqMb+Z0sLi7W+vXrlZCQ4MwSG426jOUzzzyjX/3qV9YZqj59+qi4uFizZs3Sn/70pyb9x7Y2dRlLb29vbdq0SSUlJbpw4YICAgL05JNPKigoqD5KbhA3529HLVxdXTVgwAClpqZa2yorK5Wamqrw8PAq/Xv27KmDBw8qMzPTutxzzz0aNWqUMjMzFRgYWJ/lm4q9Y1mdiooKHTx4UP7+/s4qs1Goy1gOGzZMJ0+etAZoSTp+/Lj8/f1vyrAi3djv5LvvvqvS0lL98pe/dHaZjUJdxvLSpUtVQsnVQG3cxK+1u5HfS3d3d9166626fPmyNmzYoAkTJji73IbT0Hf9mtH69esNNzc3IykpyTh8+LAxa9Ysw8vLy/p47a9+9SvjySefrHF/nhL6nr1juXDhQuPDDz80srKyjIyMDOPBBx803N3djS+++KKhTsE07B3LnJwco23btsbs2bONY8eOGVu2bDF8fHyMxYsXN9QpmEJd//sePny4MXny5Pou19TsHcsFCxYYbdu2Nf7xj38Yp06dMj766COja9euxgMPPNBQp2Aa9o7l3r17jQ0bNhhZWVnGzp07jbvuusvo0qWL8d133zXQGTgfl4SqMXnyZH3zzTeaP3++cnNz1a9fPyUnJ1tviMrJyblppy7tZe9Yfvfdd5o5c6Zyc3PVrl07DRgwQHv27FFISEhDnYJp2DuWgYGB+vDDD/X4448rLCxMt956q/7whz/oj3/8Y0OdginU5b/vY8eOadeuXfroo48aomTTsncsn376aVksFj399NP6z3/+I29vb40fP17PPvtsQ52Cadg7liUlJXr66ad16tQptWnTRj/5yU/0P//zP/Ly8mqgM3A+i2HcxPNwAACgUWCaAAAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmB6BBQAAmN7/B8PjlwEElbt8AAAAAElFTkSuQmCC",
      "text/plain": [
       "<Figure size 640x480 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# Plot correct and incorrect score distributions\n",
    "plt.axvline(np.mean(avg_correct_per_problem), color='blue', label='Correct')\n",
    "plt.axvline(np.mean(avg_incorrect_per_problem), color='red', label='Incorrect')\n",
    "plt.hist(avg_correct_per_problem, bins=50, alpha=0.5, label='Correct')\n",
    "plt.hist(avg_incorrect_per_problem, bins=50, alpha=0.5, label='Incorrect')\n",
    "plt.legend()\n",
    "plt.show()"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "llm-exploration",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.11"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
