[
    {
        "num_requests": "4788",
        "input_tokens": "515839",
        "output_tokens": "1478328",
        "mean_ttft": "236.78",
        "median_ttft": "195.42",
        "p99_ttft": "1145.49",
        "hit_ratios": [
            "0.07484506594628954",
            "0.1287779237844941",
            "0.1410575858250277",
            "0.14406339308911406",
            "0.19419025324537137",
            "0.2251403887688985",
            "0.22347349177330897",
            "0.2562906510741739",
            "0.27797669792554713",
            "0.28983544049769233",
            "0.32736595500154725",
            "0.33938134441691326",
            "0.35330855018587376",
            "0.3575646980756471",
            "0.3529569812221991",
            "0.34808524995782486",
            "0.34965819548087457",
            "0.35711128572831746",
            "0.3429407791038055",
            "0.3378172478342258",
            "0.3338220607296912",
            "0.32261003360732066",
            "0.3196020014514341",
            "0.31780298858170863",
            "0.31604777886038027",
            "0.3124505996769648",
            "0.30833625160504935",
            "0.3053261866821188",
            "0.3082160059281215",
            "0.3024698723302708",
            "0.3031472081218274",
            "0.3094546903460837",
            "0.3097641250685682",
            "0.30987231392089687",
            "0.3035829776225584",
            "0.3062990266157803",
            "0.30997448669663447",
            "0.3110973312027473",
            "0.31179397131987097",
            "0.3209080047789723",
            "0.3266234416183812",
            "0.33220011295998586",
            "0.3322665423254628",
            "0.3374121865293612",
            "0.34056585445658927",
            "0.34159119072325905",
            "0.3406281439571273",
            "0.3412380659069908"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8002  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.03,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 3,
        "result_file": "sharegpt-reqrate+/client_logs/8002_lru.json"
    },
    {
        "num_requests": "5425",
        "input_tokens": "580658",
        "output_tokens": "1682011",
        "mean_ttft": "251.07",
        "median_ttft": "203.98",
        "p99_ttft": "1276.59",
        "hit_ratios": [
            "0.07928268050967437",
            "0.14793308447393888",
            "0.15557897510209456",
            "0.17971617323219966",
            "0.17819596299411267",
            "0.1876874228258952",
            "0.19285278878390735",
            "0.22373461012311902",
            "0.23294871020358845",
            "0.26766941614103185",
            "0.29514824797843664",
            "0.3090940873137264",
            "0.3143923031612017",
            "0.3267620751341683",
            "0.32153856024637506",
            "0.3199865513341689",
            "0.32429882494210494",
            "0.3114027172652041",
            "0.3060858455566203",
            "0.3041460247222356",
            "0.2945858087658334",
            "0.28797305414914603",
            "0.28593091128144404",
            "0.28449783006643486",
            "0.28486783964007384",
            "0.29185723854176626",
            "0.2888139487483555",
            "0.29112929155800077",
            "0.28864402655636273",
            "0.2932973155495525",
            "0.2957813447885754",
            "0.29742631797426317",
            "0.2920125353512192",
            "0.2919562183207229",
            "0.29738735002645544",
            "0.29738060720368215",
            "0.30118077727623027",
            "0.3086019480170048",
            "0.3164651381909548",
            "0.3183404370388493",
            "0.31687009535326055",
            "0.3164936077523793",
            "0.3169907119231567",
            "0.31768866510819394",
            "0.3199664052426747",
            "0.3248266842586484",
            "0.3226699546040464",
            "0.3233928591028329",
            "0.3288400983479274",
            "0.32905060291717125",
            "0.33149410587762085",
            "0.3287296690970275",
            "0.3291068045468898",
            "0.32933008621874804",
            "0.32933008621874804"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8003  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.04,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 4,
        "result_file": "sharegpt-reqrate+/client_logs/8003_lru.json"
    },
    {
        "num_requests": "4128",
        "input_tokens": "464689",
        "output_tokens": "1245935",
        "mean_ttft": "234.98",
        "median_ttft": "184.49",
        "p99_ttft": "1232.47",
        "hit_ratios": [
            "0.07273023104458186",
            "0.0763585259212992",
            "0.0889254222089374",
            "0.09487428809556886",
            "0.18296340731853628",
            "0.2398591887350988",
            "0.2604708458800985",
            "0.27847881454040285",
            "0.30459411703565115",
            "0.30661691989571166",
            "0.32502282742466954",
            "0.35503764790247405",
            "0.35853972232298925",
            "0.38155053377535825",
            "0.3702710835134175",
            "0.36695210910244225",
            "0.3552246434047299",
            "0.3512581567403594",
            "0.3551162935711169",
            "0.3537401840668352",
            "0.3475340026798334",
            "0.33974622097692436",
            "0.33903094150068025",
            "0.33006360515998895",
            "0.3250392672192588",
            "0.32261471119409835",
            "0.3217431070854293",
            "0.3205912334352701",
            "0.31796193442577764",
            "0.31814526936478155",
            "0.3237827137642038",
            "0.3245526532924471",
            "0.32315420952929036",
            "0.3242940517597123",
            "0.32855484152804443",
            "0.33506903618100575",
            "0.33246205642862514",
            "0.3283010999322316",
            "0.32764381100422924",
            "0.32883509228229874",
            "0.32899052113746347",
            "0.32899052113746347"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.02,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 2,
        "result_file": "sharegpt-reqrate+/client_logs/8001_lru.json"
    },
    {
        "num_requests": "2988",
        "input_tokens": "355242",
        "output_tokens": "909273",
        "mean_ttft": "246.82",
        "median_ttft": "185.16",
        "p99_ttft": "1512.09",
        "hit_ratios": [
            "0.036632498739707614",
            "0.05566343042071197",
            "0.06975648075412412",
            "0.14782276546982429",
            "0.2249091951825655",
            "0.29268667024787043",
            "0.32950411640819455",
            "0.33611499946161294",
            "0.35564044519901905",
            "0.3533460183798227",
            "0.36493553008595997",
            "0.3812903841869053",
            "0.3969096209912539",
            "0.40596072556049023",
            "0.40741104776882264",
            "0.4119326617784783",
            "0.40940174440031135",
            "0.4038826756699726",
            "0.4037691317408097",
            "0.4027936914470581",
            "0.3991954225634286",
            "0.3944496367089752",
            "0.3820316884686784",
            "0.373279768689705",
            "0.35720004725215604",
            "0.34459501654905406",
            "0.3407947994603215",
            "0.3374273335194244",
            "0.33728392066476626",
            "0.33728392066476626"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-reqrate+/client_logs/8000_lru.json"
    },
    {
        "num_requests": "2479",
        "input_tokens": "417556",
        "output_tokens": "749724",
        "mean_ttft": "295.10",
        "median_ttft": "207.53",
        "p99_ttft": "1475.92",
        "hit_ratios": [
            "0.0026790498303268444",
            "0.005864091065884788",
            "0.021877087508350036",
            "0.15992390615091948",
            "0.2679833478555522",
            "0.34244023595156775",
            "0.386813753951358",
            "0.39414062499999997",
            "0.3937986012617987",
            "0.39767779390420893",
            "0.4031979753824916",
            "0.39501407027924085",
            "0.3536532373207522",
            "0.3416019127316197",
            "0.32302521008403356",
            "0.30453975551144086",
            "0.29633187552139945",
            "0.25991053524602803",
            "0.24921355431225584",
            "0.2393003198769081",
            "0.23302614996849397",
            "0.22578494131992072",
            "0.22578494131992072",
            "0.22578494131992072",
            "0.22578494131992072"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.0025,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 0.25,
        "result_file": "sharegpt-reqrate+/client_logs/8000_lru.json"
    },
    {
        "num_requests": "2411",
        "input_tokens": "347817",
        "output_tokens": "738010",
        "mean_ttft": "268.07",
        "median_ttft": "163.63",
        "p99_ttft": "1564.19",
        "hit_ratios": [
            "0.00705009276437848",
            "0.01837088388214905",
            "0.04828504828504829",
            "0.19668160348794964",
            "0.29063489108173524",
            "0.3447663684135776",
            "0.39551029854200415",
            "0.41503644035289605",
            "0.43309769184907587",
            "0.4378040043738924",
            "0.4484543102274275",
            "0.44093402475944965",
            "0.43183718985224423",
            "0.42819646569646574",
            "0.4195433964976164",
            "0.40138370062553874",
            "0.39134157547406223",
            "0.38215188137817563",
            "0.35163778209215746",
            "0.3342417061611374",
            "0.31826520759575144",
            "0.31826520759575144",
            "0.31826520759575144",
            "0.31826520759575144",
            "0.31826520759575144"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.005,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 0.5,
        "result_file": "sharegpt-reqrate+/client_logs/8001_lru.json"
    },
    {
        "num_requests": "4155",
        "input_tokens": "467117",
        "output_tokens": "1254997",
        "mean_ttft": "231.42",
        "median_ttft": "184.23",
        "p99_ttft": "1235.17",
        "hit_ratios": [
            "0.07273023104458186",
            "0.07651467832604623",
            "0.0995366910775669",
            "0.12251701625225728",
            "0.21975604879024194",
            "0.2640557424315233",
            "0.28572406241445386",
            "0.31125331488527613",
            "0.3213283442469598",
            "0.32545095575697747",
            "0.3401881773790147",
            "0.367335962710649",
            "0.3764264807445655",
            "0.3920858933025123",
            "0.38520666356648514",
            "0.38569507274727954",
            "0.38292190148858596",
            "0.3802718565225929",
            "0.38362927314968476",
            "0.3766842979035559",
            "0.3723911528445146",
            "0.3723138876020099",
            "0.3753482864307607",
            "0.36622144226706965",
            "0.36152660824629945",
            "0.35817663296274266",
            "0.3573403942335981",
            "0.35450758912813274",
            "0.35332297410651664",
            "0.35424299965232275",
            "0.35765412145001163",
            "0.3554738873388317",
            "0.35622436005086017",
            "0.35977970509667323",
            "0.3635414395704008",
            "0.36935637197338256",
            "0.36582034820574033",
            "0.36443370381558526",
            "0.3643847793367477",
            "0.36416744892048974",
            "0.36412062206350326",
            "0.36412062206350326"
        ],
        "args": " --port 8003  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.02,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 2,
        "result_file": "sharegpt-reqrate++/client_logs/8003_ml.json"
    },
    {
        "num_requests": "3011",
        "input_tokens": "358288",
        "output_tokens": "912522",
        "mean_ttft": "251.31",
        "median_ttft": "189.35",
        "p99_ttft": "1542.96",
        "hit_ratios": [
            "0.036632498739707614",
            "0.05398832684824903",
            "0.06972361809045227",
            "0.1523128034755942",
            "0.2467023513668515",
            "0.3151972872996301",
            "0.34926400305868865",
            "0.3552446035361754",
            "0.3675808820046422",
            "0.37878541852723885",
            "0.38021883098186016",
            "0.4018525002387243",
            "0.41448979591836743",
            "0.42798673158204487",
            "0.43292383292383285",
            "0.43746571585298955",
            "0.4346464108758855",
            "0.4343056594365494",
            "0.430595002054195",
            "0.4352030947775629",
            "0.4371683123733556",
            "0.43245934284766013",
            "0.4235512245601932",
            "0.4177701896116154",
            "0.40326272858834356",
            "0.38738705053904166",
            "0.38389276560258045",
            "0.380142635358044",
            "0.37940048164776796",
            "0.37940048164776796",
            "0.37940048164776796"
        ],
        "args": " --port 8002  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-reqrate++/client_logs/8002_ml.json"
    },
    {
        "num_requests": "2516",
        "input_tokens": "425686",
        "output_tokens": "757799",
        "mean_ttft": "430.19",
        "median_ttft": "219.32",
        "p99_ttft": "9267.39",
        "hit_ratios": [
            "0.0026790498303268444",
            "0.005857019810508183",
            "0.023337222870478416",
            "0.18194532739987285",
            "0.286836744592104",
            "0.36240671641791045",
            "0.4151540598152574",
            "0.43344900929139135",
            "0.4328584716306848",
            "0.4293343587114415",
            "0.43105232892466927",
            "0.4292776214187774",
            "0.3880268139780273",
            "0.3810635305383486",
            "0.3646682922727653",
            "0.34260106091091996",
            "0.330638319109647",
            "0.2969816272965879",
            "0.2845329313737805",
            "0.276161906885299",
            "0.2646665244458235",
            "0.2587154225085259",
            "0.2587154225085259",
            "0.2587154225085259",
            "0.2587154225085259",
            "0.2587154225085259"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.0025,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 0.25,
        "result_file": "sharegpt-reqrate++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "2457",
        "input_tokens": "354753",
        "output_tokens": "748443",
        "mean_ttft": "322.92",
        "median_ttft": "175.24",
        "p99_ttft": "4017.40",
        "hit_ratios": [
            "0.006757958385203629",
            "0.01837088388214905",
            "0.04817469578263045",
            "0.20491400491400488",
            "0.32939094803501584",
            "0.3765705311250714",
            "0.42847181871005224",
            "0.44770194653020234",
            "0.4658663704716336",
            "0.4739668015275834",
            "0.4710560447812137",
            "0.466969087030973",
            "0.45963236115767125",
            "0.4627520174368821",
            "0.450718759749454",
            "0.43411264612114764",
            "0.42782623210783294",
            "0.4216638223582259",
            "0.39345547871961223",
            "0.3773722503943151",
            "0.35819241701594645",
            "0.3575761445629271",
            "0.3575761445629271",
            "0.3575761445629271",
            "0.3575761445629271"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.005,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 0.5,
        "result_file": "sharegpt-reqrate++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "2999",
        "input_tokens": "357072",
        "output_tokens": "909117",
        "mean_ttft": "242.69",
        "median_ttft": "172.97",
        "p99_ttft": "1516.10",
        "hit_ratios": [
            "0.0363147276395427",
            "0.05521373056994819",
            "0.06686642485412396",
            "0.143838229683327",
            "0.2137977484845569",
            "0.2729320388349515",
            "0.30704446040347333",
            "0.3245268357662209",
            "0.34785830739587975",
            "0.34364509412314626",
            "0.3592737682687962",
            "0.38098270545649554",
            "0.3953252967700378",
            "0.40291929824561407",
            "0.4049659302085485",
            "0.41195096792765135",
            "0.40675844806007505",
            "0.4022193079794209",
            "0.40284538329981767",
            "0.40189250970177015",
            "0.3965846325355133",
            "0.39361397023676736",
            "0.38141779605712456",
            "0.3735149783930271",
            "0.3578759296962646",
            "0.3452346484878792",
            "0.34151696349007493",
            "0.33840231237530044",
            "0.33777539506267384",
            "0.33777539506267384",
            "0.33777539506267384"
        ],
        "args": " --port 8002  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-reqrate++/client_logs/8002_lru.json"
    },
    {
        "num_requests": "4165",
        "input_tokens": "467383",
        "output_tokens": "1257400",
        "mean_ttft": "225.52",
        "median_ttft": "178.76",
        "p99_ttft": "1211.33",
        "hit_ratios": [
            "0.07262660804429247",
            "0.0759375",
            "0.08828370492293881",
            "0.0926312856943864",
            "0.1745565129244805",
            "0.22850142915475702",
            "0.25224144016943173",
            "0.26463028274254285",
            "0.2920960345292689",
            "0.30307256077720446",
            "0.32242158040856916",
            "0.34926566762584543",
            "0.35635481777504513",
            "0.3758625055390263",
            "0.370888952002272",
            "0.3769536837177852",
            "0.3597247374139804",
            "0.3572394198382329",
            "0.3610349813332181",
            "0.3583738400353511",
            "0.35226534123494535",
            "0.3446906432097389",
            "0.3443894269278379",
            "0.3378715211524245",
            "0.3304274282740224",
            "0.3300377924128142",
            "0.3289861559119039",
            "0.32714285714285707",
            "0.3243347860993233",
            "0.3250501448629373",
            "0.3311070741611455",
            "0.33154998080122877",
            "0.33134440614227517",
            "0.3311240428790199",
            "0.3353898394251348",
            "0.34013613384548924",
            "0.3378510282617719",
            "0.33295188273118625",
            "0.3333895269202402",
            "0.33400012502344184",
            "0.3345764296473276",
            "0.3345764296473276"
        ],
        "args": " --port 8003  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.02,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 2,
        "result_file": "sharegpt-reqrate++/client_logs/8003_lru.json"
    },
    {
        "num_requests": "2540",
        "input_tokens": "427941",
        "output_tokens": "765805",
        "mean_ttft": "473.55",
        "median_ttft": "214.81",
        "p99_ttft": "9295.95",
        "hit_ratios": [
            "0.002655807365439094",
            "0.005685733976567884",
            "0.02317825579456395",
            "0.1390659555093014",
            "0.22460485251182924",
            "0.29991922455573505",
            "0.34266160726385686",
            "0.35187580853816297",
            "0.35423684892459173",
            "0.3645758122743681",
            "0.37302329362982223",
            "0.3636121064267742",
            "0.32391325679521143",
            "0.313410710906453",
            "0.29680459431600636",
            "0.2790340706630485",
            "0.272154757792363",
            "0.2370603505708837",
            "0.22789303115148035",
            "0.2192547373775912",
            "0.2085310916257742",
            "0.2015887814163073",
            "0.2015848660827004",
            "0.2015848660827004",
            "0.2015848660827004",
            "0.2015848660827004"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.0025,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 0.25,
        "result_file": "sharegpt-reqrate++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "2456",
        "input_tokens": "354748",
        "output_tokens": "748229",
        "mean_ttft": "267.06",
        "median_ttft": "168.30",
        "p99_ttft": "1467.92",
        "hit_ratios": [
            "0.006402276364929753",
            "0.01785404749523314",
            "0.04666666666666667",
            "0.16813829125730628",
            "0.26128970531955603",
            "0.31385839534369697",
            "0.3668207248844563",
            "0.3965768940347344",
            "0.4105795726611555",
            "0.42101052126255156",
            "0.43174854918357786",
            "0.42535917034030013",
            "0.4172140363335109",
            "0.4165131560858927",
            "0.40766878980891724",
            "0.3936274969520774",
            "0.3816758544652702",
            "0.3727797144754317",
            "0.3418954494170741",
            "0.3257117278424352",
            "0.3080078683232738",
            "0.3078073285059056",
            "0.3078073285059056",
            "0.3078073285059056",
            "0.3078073285059056"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.005,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 0.5,
        "result_file": "sharegpt-reqrate++/client_logs/8001_lru.json"
    }
]