{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "73309e74",
   "metadata": {},
   "outputs": [],
   "source": [
    "import json"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "4f66d9a7",
   "metadata": {},
   "outputs": [],
   "source": [
    "assistant_o4_mini_high = {\n",
    "  \"Scalability\": [4, 5, 7, 5, 6, 6, 4, 4, 4],\n",
    "  \"Reliability\": [3, 4, 5, 4, 4, 3, 3, 3, 3],\n",
    "  \"Accuracy\": [6, 4, 4, 7, 5, 5, 6, 5, 6],\n",
    "  \"Usability\": [2, 3, 1, 5, 3, 4, 3, 3, 3],\n",
    "  \"Relevance\": [8, 3, 1, 9, 7, 8, 7, 8, 8],\n",
    "  \"Cost-effectiveness\": [3, 3, 3, 3, 4, 3, 3, 4, 3],\n",
    "  \"Documentation\": [2, 2, 1, 2, 3, 2, 2, 2, 2]\n",
    "}\n",
    "\n",
    "partial_intrinsic_memory_o4_mini_high = {\n",
    "  \"Scalability\": [6, 6, 5, 7, 6, 6, 4, 8, 4, 6],\n",
    "  \"Reliability\": [4, 5, 3, 6, 4, 5, 3, 3, 3, 5],\n",
    "  \"Accuracy\": [3, 3, 4, 5, 4, 4, 5, 4, 3, 5],\n",
    "  \"Usability\": [5, 2, 3, 3, 3, 3, 2, 2, 2, 3],\n",
    "  \"Relevance\": [6, 5, 8, 3, 7, 3, 6, 6, 8, 9],\n",
    "  \"Cost-effectiveness\": [4, 4, 2, 4, 5, 5, 3, 3, 4, 4],\n",
    "  \"Documentation\": [5, 2, 3, 2, 4, 4, 2, 1, 3, 3]\n",
    "}\n",
    "\n",
    "all_intrinsic_memory_o4_mini_high = {\n",
    "  \"Scalability\":           [6, 6, 6, 8, 8, 7, 8, 8, 6],\n",
    "  \"Reliability\":           [5, 4, 4, 6, 5, 5, 5, 6, 4],\n",
    "  \"Accuracy\":              [4, 3, 6, 5, 6, 3, 6, 4, 5],\n",
    "  \"Usability\":             [3, 4, 4, 4, 4, 3, 4, 4, 3],\n",
    "  \"Relevance\":             [6, 6, 2, 4, 5, 5, 8, 9, 8],\n",
    "  \"Cost-effectiveness\":    [4, 4, 3, 7, 4, 5, 6, 5, 4],\n",
    "  \"Documentation\":         [2, 5, 3, 3, 3, 4, 4, 3, 5]\n",
    "}\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "307415b3",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Assistant Scores: {'Scalability': 45, 'Reliability': 32, 'Accuracy': 48, 'Usability': 27, 'Relevance': 59, 'Cost-effectiveness': 29, 'Documentation': 18}\n",
      "Partial Memory Scores: {'Scalability': 58, 'Reliability': 41, 'Accuracy': 40, 'Usability': 28, 'Relevance': 61, 'Cost-effectiveness': 38, 'Documentation': 29}\n",
      "All Memory Scores: {'Scalability': 63, 'Reliability': 44, 'Accuracy': 42, 'Usability': 33, 'Relevance': 53, 'Cost-effectiveness': 42, 'Documentation': 32}\n"
     ]
    }
   ],
   "source": [
    "# Add total scores for each category across all rows for each column\n",
    "\n",
    "\n",
    "def calculate_scores(data):\n",
    "    scores = {}\n",
    "    for key in data:\n",
    "        scores[key] = sum(data[key])\n",
    "    return scores\n",
    "\n",
    "assistant_scores = calculate_scores(assistant_o4_mini_high)\n",
    "partial_memory_scores = calculate_scores(partial_intrinsic_memory_o4_mini_high)\n",
    "all_memory_scores = calculate_scores(all_intrinsic_memory_o4_mini_high)\n",
    "\n",
    "print(\"Assistant Scores:\", assistant_scores)\n",
    "print(\"Partial Memory Scores:\", partial_memory_scores)\n",
    "print(\"All Memory Scores:\", all_memory_scores)\n"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "d095fe1a",
   "metadata": {},
   "source": [
    "Total number of turns"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "40372921",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "160 172 143\n",
      "0.11888111888111888\n"
     ]
    }
   ],
   "source": [
    "all_memory_agent = [14, 16, 20, 14, 16, 14, 16, 16, 16, 18]\n",
    "partial_memory_agent = [16, 18, 16, 16, 16, 16, 16, 26, 16, 16]\n",
    "assistant_agent = [17, 18, 10, 14, 16, 14, 14, 10, 14, 16]\n",
    "\n",
    "print(sum(all_memory_agent), sum(partial_memory_agent), sum(assistant_agent))\n",
    "\n",
    "print((160-143)/143)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "c62ab123",
   "metadata": {},
   "source": [
    "Total tokens with Llama3.2:latest"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "39bca690",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "478300 510346 360778\n",
      "0.32574602664242275\n"
     ]
    }
   ],
   "source": [
    "all_memory_agent = [38318, 51173, 63578, 38756, 45375, 37836, 45833, 54731, 46520, 56180]\n",
    "partial_memory_agent = [47614, 54196, 43763, 48305, 47300, 45453, 42921, 92147, 42474, 46173]\n",
    "assistant_agent = [45013, 50328, 18928, 33194, 43624, 37516, 35127, 17925, 35550, 43573]\n",
    "\n",
    "print(sum(all_memory_agent),sum(partial_memory_agent),sum(assistant_agent))\n",
    "\n",
    "print((478300-360778)/360778)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
