{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "d593d6ef",
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "import numpy as np"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "06c9e51e",
   "metadata": {},
   "outputs": [],
   "source": [
    "def extract_ttft_tpot(data, share_ttft_con, share_tpot_cons,split_ttft_cons, split_tpot_cons):\n",
    "    ttfts = data['ttfts']\n",
    "    tpots = data['tpots']\n",
    "    e2els = data['e2els']\n",
    "    dataset = data['dataset']\n",
    "    ttft_class = [[],[]] # sharegpt, splitwise\n",
    "    tpot_class = [[],[]]\n",
    "    e2el_class = [[],[]]\n",
    "    goodput = [0,0]\n",
    "    for i in range(len(ttfts)):\n",
    "        idx = 0 if dataset[i] == 'sharegpt' else 1\n",
    "        ttft_class[idx].append(ttfts[i])\n",
    "        tpot_class[idx].append(tpots[i])\n",
    "        e2el_class[idx].append(e2els[i])\n",
    "        if (idx == 0 and ttfts[i] <= share_ttft_con and tpots[i] <= share_tpot_cons) or (idx==1 and ttfts[i] <= split_ttft_cons and tpots[i] <= split_tpot_cons):\n",
    "            goodput[idx] += 1\n",
    "    \n",
    "    scale = 1000\n",
    "    \n",
    "    print('-----sharegpt-----')\n",
    "    print(f'avg ttft: {round(np.mean(ttft_class[0])*scale,4)} ms')\n",
    "    print(f'avg tpot: {round(np.mean(tpot_class[0])*scale,4)} ms')\n",
    "    print(f'avg e2el: {round(np.mean(e2el_class[0])*scale,4)} ms')\n",
    "    print(f'goodput : {round(goodput[0]/len(ttft_class[0])*100,4)} %')\n",
    "    \n",
    "    print()\n",
    "    \n",
    "    print('-----splitwise-----')\n",
    "    print(f'avg ttft: {round(np.mean(ttft_class[1])*scale,4)} ms')\n",
    "    print(f'avg tpot: {round(np.mean(tpot_class[1])*scale,4)} ms')\n",
    "    print(f'avg e2el: {round(np.mean(e2el_class[1])*scale,4)} ms')\n",
    "    print(f'goodput : {round(goodput[1]/len(ttft_class[1])*100,4)} %')\n",
    "    \n",
    "\n",
    "def extract_throughput(data):\n",
    "    print(f\"token_throughput: {round(data['total_token_throughput'],4)} toks/s\")\n",
    "    print()\n",
    "\n",
    "def process_output(result_path,share_ttft_con, share_tpot_cons,split_ttft_cons, split_tpot_cons):\n",
    "    with open(result_path, 'r') as f:\n",
    "        data = json.load(f)\n",
    "        print(data.keys())\n",
    "        extract_throughput(data)\n",
    "        extract_ttft_tpot(data,share_ttft_con, share_tpot_cons,split_ttft_cons, split_tpot_cons)\n",
    "        "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "cb888b1e",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "dict_keys(['date', 'backend', 'model_id', 'tokenizer_id', 'best_of', 'num_prompts', 'request_rate', 'burstiness', 'max_concurrency', 'duration', 'completed', 'total_input_tokens', 'total_output_tokens', 'request_throughput', 'request_goodput:', 'output_throughput', 'total_token_throughput', 'input_lens', 'output_lens', 'ttfts', 'e2els', 'tpots', 'dataset', 'mean_ttft_ms', 'median_ttft_ms', 'std_ttft_ms', 'p99_ttft_ms', 'mean_tpot_ms', 'median_tpot_ms', 'std_tpot_ms', 'p99_tpot_ms', 'mean_itl_ms', 'median_itl_ms', 'std_itl_ms', 'p99_itl_ms', 'mean_e2el_ms', 'median_e2el_ms', 'std_e2el_ms', 'p99_e2el_ms'])\n",
      "token_throughput: 4298.9434 toks/s\n",
      "\n",
      "-----sharegpt-----\n",
      "avg ttft: 464.2457 ms\n",
      "avg tpot: 70.6599 ms\n",
      "avg e2el: 11420.0364 ms\n",
      "goodput : 90.2344 %\n",
      "\n",
      "-----splitwise-----\n",
      "avg ttft: 47946.5493 ms\n",
      "avg tpot: 409.6298 ms\n",
      "avg e2el: 57474.1158 ms\n",
      "goodput : 47.2656 %\n"
     ]
    }
   ],
   "source": [
    "# result_path = '../vllm-infqps-Qwen2.5-32B-20250426-184543.json'\n",
    "result_path = '/mnt/sda/2022-0526/home/xuhx/projects/gLLM/experiments/results/tmp/rate_8_dynamic.json'\n",
    "process_output(result_path, 1, 0.1, 50, 0.5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "88861c7f",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "dict_keys(['date', 'backend', 'model_id', 'tokenizer_id', 'best_of', 'num_prompts', 'request_rate', 'burstiness', 'max_concurrency', 'duration', 'completed', 'total_input_tokens', 'total_output_tokens', 'request_throughput', 'request_goodput:', 'output_throughput', 'total_token_throughput', 'input_lens', 'output_lens', 'ttfts', 'e2els', 'tpots', 'dataset', 'mean_ttft_ms', 'median_ttft_ms', 'std_ttft_ms', 'p99_ttft_ms', 'mean_tpot_ms', 'median_tpot_ms', 'std_tpot_ms', 'p99_tpot_ms', 'mean_itl_ms', 'median_itl_ms', 'std_itl_ms', 'p99_itl_ms', 'mean_e2el_ms', 'median_e2el_ms', 'std_e2el_ms', 'p99_e2el_ms'])\n",
      "token_throughput: 5217.3938 toks/s\n",
      "\n",
      "-----sharegpt-----\n",
      "avg ttft: 447.4139 ms\n",
      "avg tpot: 69.8557 ms\n",
      "avg e2el: 11284.9133 ms\n",
      "goodput : 91.4062 %\n",
      "\n",
      "-----splitwise-----\n",
      "avg ttft: 50793.1442 ms\n",
      "avg tpot: 437.6696 ms\n",
      "avg e2el: 60921.8616 ms\n",
      "goodput : 34.9609 %\n"
     ]
    }
   ],
   "source": [
    "# result_path = '../vllm-infqps-Qwen2.5-32B-20250426-184543.json'\n",
    "result_path = '/mnt/sda/2022-0526/home/xuhx/projects/gLLM/experiments/results/tmp/rate_8_baseline3.json'\n",
    "process_output(result_path, 1, 0.1, 50, 0.5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "14c9f4e4",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "dict_keys(['date', 'backend', 'model_id', 'tokenizer_id', 'best_of', 'num_prompts', 'request_rate', 'burstiness', 'max_concurrency', 'duration', 'completed', 'total_input_tokens', 'total_output_tokens', 'request_throughput', 'request_goodput:', 'output_throughput', 'total_token_throughput', 'input_lens', 'output_lens', 'ttfts', 'e2els', 'tpots', 'dataset', 'mean_ttft_ms', 'median_ttft_ms', 'std_ttft_ms', 'p99_ttft_ms', 'mean_tpot_ms', 'median_tpot_ms', 'std_tpot_ms', 'p99_tpot_ms', 'mean_itl_ms', 'median_itl_ms', 'std_itl_ms', 'p99_itl_ms', 'mean_e2el_ms', 'median_e2el_ms', 'std_e2el_ms', 'p99_e2el_ms'])\n",
      "token_throughput: 5481.942 toks/s\n",
      "\n",
      "-----sharegpt-----\n",
      "avg ttft: 497.8223 ms\n",
      "avg tpot: 78.4373 ms\n",
      "avg e2el: 12695.3589 ms\n",
      "goodput : 87.6953 %\n",
      "\n",
      "-----splitwise-----\n",
      "avg ttft: 47339.5689 ms\n",
      "avg tpot: 435.2925 ms\n",
      "avg e2el: 57394.8271 ms\n",
      "goodput : 42.2852 %\n"
     ]
    }
   ],
   "source": [
    "# result_path = '../vllm-infqps-Qwen2.5-32B-20250426-184543.json'\n",
    "result_path = '/mnt/sda/2022-0526/home/xuhx/projects/gLLM/experiments/results/tmp/rate_8_baseline0.json'\n",
    "process_output(result_path, 1, 0.1, 50, 0.5)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "gllm",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.0"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
