[
    {
        "num_requests": "4788",
        "input_tokens": "515839",
        "output_tokens": "1478328",
        "mean_ttft": "236.78",
        "median_ttft": "195.42",
        "p99_ttft": "1145.49",
        "hit_ratios": [
            "0.07484506594628954",
            "0.1287779237844941",
            "0.1410575858250277",
            "0.14406339308911406",
            "0.19419025324537137",
            "0.2251403887688985",
            "0.22347349177330897",
            "0.2562906510741739",
            "0.27797669792554713",
            "0.28983544049769233",
            "0.32736595500154725",
            "0.33938134441691326",
            "0.35330855018587376",
            "0.3575646980756471",
            "0.3529569812221991",
            "0.34808524995782486",
            "0.34965819548087457",
            "0.35711128572831746",
            "0.3429407791038055",
            "0.3378172478342258",
            "0.3338220607296912",
            "0.32261003360732066",
            "0.3196020014514341",
            "0.31780298858170863",
            "0.31604777886038027",
            "0.3124505996769648",
            "0.30833625160504935",
            "0.3053261866821188",
            "0.3082160059281215",
            "0.3024698723302708",
            "0.3031472081218274",
            "0.3094546903460837",
            "0.3097641250685682",
            "0.30987231392089687",
            "0.3035829776225584",
            "0.3062990266157803",
            "0.30997448669663447",
            "0.3110973312027473",
            "0.31179397131987097",
            "0.3209080047789723",
            "0.3266234416183812",
            "0.33220011295998586",
            "0.3322665423254628",
            "0.3374121865293612",
            "0.34056585445658927",
            "0.34159119072325905",
            "0.3406281439571273",
            "0.3412380659069908"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8002  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.03,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 3,
        "result_file": "sharegpt-reqrate+/client_logs/8002_lru.json"
    },
    {
        "num_requests": "5425",
        "input_tokens": "580658",
        "output_tokens": "1682011",
        "mean_ttft": "251.07",
        "median_ttft": "203.98",
        "p99_ttft": "1276.59",
        "hit_ratios": [
            "0.07928268050967437",
            "0.14793308447393888",
            "0.15557897510209456",
            "0.17971617323219966",
            "0.17819596299411267",
            "0.1876874228258952",
            "0.19285278878390735",
            "0.22373461012311902",
            "0.23294871020358845",
            "0.26766941614103185",
            "0.29514824797843664",
            "0.3090940873137264",
            "0.3143923031612017",
            "0.3267620751341683",
            "0.32153856024637506",
            "0.3199865513341689",
            "0.32429882494210494",
            "0.3114027172652041",
            "0.3060858455566203",
            "0.3041460247222356",
            "0.2945858087658334",
            "0.28797305414914603",
            "0.28593091128144404",
            "0.28449783006643486",
            "0.28486783964007384",
            "0.29185723854176626",
            "0.2888139487483555",
            "0.29112929155800077",
            "0.28864402655636273",
            "0.2932973155495525",
            "0.2957813447885754",
            "0.29742631797426317",
            "0.2920125353512192",
            "0.2919562183207229",
            "0.29738735002645544",
            "0.29738060720368215",
            "0.30118077727623027",
            "0.3086019480170048",
            "0.3164651381909548",
            "0.3183404370388493",
            "0.31687009535326055",
            "0.3164936077523793",
            "0.3169907119231567",
            "0.31768866510819394",
            "0.3199664052426747",
            "0.3248266842586484",
            "0.3226699546040464",
            "0.3233928591028329",
            "0.3288400983479274",
            "0.32905060291717125",
            "0.33149410587762085",
            "0.3287296690970275",
            "0.3291068045468898",
            "0.32933008621874804",
            "0.32933008621874804"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8003  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.04,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 4,
        "result_file": "sharegpt-reqrate+/client_logs/8003_lru.json"
    },
    {
        "num_requests": "4128",
        "input_tokens": "464689",
        "output_tokens": "1245935",
        "mean_ttft": "234.98",
        "median_ttft": "184.49",
        "p99_ttft": "1232.47",
        "hit_ratios": [
            "0.07273023104458186",
            "0.0763585259212992",
            "0.0889254222089374",
            "0.09487428809556886",
            "0.18296340731853628",
            "0.2398591887350988",
            "0.2604708458800985",
            "0.27847881454040285",
            "0.30459411703565115",
            "0.30661691989571166",
            "0.32502282742466954",
            "0.35503764790247405",
            "0.35853972232298925",
            "0.38155053377535825",
            "0.3702710835134175",
            "0.36695210910244225",
            "0.3552246434047299",
            "0.3512581567403594",
            "0.3551162935711169",
            "0.3537401840668352",
            "0.3475340026798334",
            "0.33974622097692436",
            "0.33903094150068025",
            "0.33006360515998895",
            "0.3250392672192588",
            "0.32261471119409835",
            "0.3217431070854293",
            "0.3205912334352701",
            "0.31796193442577764",
            "0.31814526936478155",
            "0.3237827137642038",
            "0.3245526532924471",
            "0.32315420952929036",
            "0.3242940517597123",
            "0.32855484152804443",
            "0.33506903618100575",
            "0.33246205642862514",
            "0.3283010999322316",
            "0.32764381100422924",
            "0.32883509228229874",
            "0.32899052113746347",
            "0.32899052113746347"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.02,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 2,
        "result_file": "sharegpt-reqrate+/client_logs/8001_lru.json"
    },
    {
        "num_requests": "2988",
        "input_tokens": "355242",
        "output_tokens": "909273",
        "mean_ttft": "246.82",
        "median_ttft": "185.16",
        "p99_ttft": "1512.09",
        "hit_ratios": [
            "0.036632498739707614",
            "0.05566343042071197",
            "0.06975648075412412",
            "0.14782276546982429",
            "0.2249091951825655",
            "0.29268667024787043",
            "0.32950411640819455",
            "0.33611499946161294",
            "0.35564044519901905",
            "0.3533460183798227",
            "0.36493553008595997",
            "0.3812903841869053",
            "0.3969096209912539",
            "0.40596072556049023",
            "0.40741104776882264",
            "0.4119326617784783",
            "0.40940174440031135",
            "0.4038826756699726",
            "0.4037691317408097",
            "0.4027936914470581",
            "0.3991954225634286",
            "0.3944496367089752",
            "0.3820316884686784",
            "0.373279768689705",
            "0.35720004725215604",
            "0.34459501654905406",
            "0.3407947994603215",
            "0.3374273335194244",
            "0.33728392066476626",
            "0.33728392066476626"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-reqrate+/client_logs/8000_lru.json"
    },
    {
        "num_requests": "2479",
        "input_tokens": "417556",
        "output_tokens": "749724",
        "mean_ttft": "295.10",
        "median_ttft": "207.53",
        "p99_ttft": "1475.92",
        "hit_ratios": [
            "0.0026790498303268444",
            "0.005864091065884788",
            "0.021877087508350036",
            "0.15992390615091948",
            "0.2679833478555522",
            "0.34244023595156775",
            "0.386813753951358",
            "0.39414062499999997",
            "0.3937986012617987",
            "0.39767779390420893",
            "0.4031979753824916",
            "0.39501407027924085",
            "0.3536532373207522",
            "0.3416019127316197",
            "0.32302521008403356",
            "0.30453975551144086",
            "0.29633187552139945",
            "0.25991053524602803",
            "0.24921355431225584",
            "0.2393003198769081",
            "0.23302614996849397",
            "0.22578494131992072",
            "0.22578494131992072",
            "0.22578494131992072",
            "0.22578494131992072"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.0025,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 0.25,
        "result_file": "sharegpt-reqrate+/client_logs/8000_lru.json"
    },
    {
        "num_requests": "2411",
        "input_tokens": "347817",
        "output_tokens": "738010",
        "mean_ttft": "268.07",
        "median_ttft": "163.63",
        "p99_ttft": "1564.19",
        "hit_ratios": [
            "0.00705009276437848",
            "0.01837088388214905",
            "0.04828504828504829",
            "0.19668160348794964",
            "0.29063489108173524",
            "0.3447663684135776",
            "0.39551029854200415",
            "0.41503644035289605",
            "0.43309769184907587",
            "0.4378040043738924",
            "0.4484543102274275",
            "0.44093402475944965",
            "0.43183718985224423",
            "0.42819646569646574",
            "0.4195433964976164",
            "0.40138370062553874",
            "0.39134157547406223",
            "0.38215188137817563",
            "0.35163778209215746",
            "0.3342417061611374",
            "0.31826520759575144",
            "0.31826520759575144",
            "0.31826520759575144",
            "0.31826520759575144",
            "0.31826520759575144"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.005,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 0.5,
        "result_file": "sharegpt-reqrate+/client_logs/8001_lru.json"
    },
    {
        "num_requests": "2996",
        "input_tokens": "357292",
        "output_tokens": "911431",
        "mean_ttft": "244.88",
        "median_ttft": "176.73",
        "p99_ttft": "1522.33",
        "hit_ratios": [
            "0.036632498739707614",
            "0.05566343042071197",
            "0.06975648075412412",
            "0.14528494761052899",
            "0.22519594723762187",
            "0.2930703706545929",
            "0.3300834767093608",
            "0.3356153307099347",
            "0.3549879609083612",
            "0.3526622902990518",
            "0.36061381074168797",
            "0.3801681850035039",
            "0.39585764294049003",
            "0.40278150673897856",
            "0.40528959810874693",
            "0.4101021696705313",
            "0.4070925481016035",
            "0.4019994232432951",
            "0.4030294882136774",
            "0.4021959117587532",
            "0.398515686494996",
            "0.39321173288199107",
            "0.37970412665455483",
            "0.3714735946673359",
            "0.3554370721432332",
            "0.34292406743993786",
            "0.3391227336465842",
            "0.3356000243294204",
            "0.33504510082431926",
            "0.33504510082431926",
            "0.33504510082431926"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8002  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-reqrate+/client_logs/8002_lru.json"
    },
    {
        "num_requests": "4130",
        "input_tokens": "464583",
        "output_tokens": "1250030",
        "mean_ttft": "230.11",
        "median_ttft": "180.50",
        "p99_ttft": "1197.63",
        "hit_ratios": [
            "0.07273023104458186",
            "0.07647885125643827",
            "0.08917102315160567",
            "0.09170731707317076",
            "0.17904589371980678",
            "0.23600483286347163",
            "0.2599795291709315",
            "0.2799515933844293",
            "0.3050476636974529",
            "0.3089786351753359",
            "0.3261567741168076",
            "0.3523435529776275",
            "0.3589228030852398",
            "0.38022500685996546",
            "0.3680225247389428",
            "0.3660942100098137",
            "0.35378876194917247",
            "0.3496610206439519",
            "0.35305641816552386",
            "0.34417847567981613",
            "0.34328330588300604",
            "0.33543734714429574",
            "0.3359524688428342",
            "0.3264849138635546",
            "0.320765396770491",
            "0.3163638599403608",
            "0.31761062209181706",
            "0.31582921373926165",
            "0.31347286350189385",
            "0.3118092384923686",
            "0.3183551585506158",
            "0.31933794883247696",
            "0.3181176129709888",
            "0.3208589757271764",
            "0.3248095441776581",
            "0.3307333348362222",
            "0.3276801282259545",
            "0.32418465416732273",
            "0.3232723091169972",
            "0.32451459982853353",
            "0.32440116138398223",
            "0.32440116138398223"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8003  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.02,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 2,
        "result_file": "sharegpt-reqrate+/client_logs/8003_lru.json"
    },
    {
        "num_requests": "2515",
        "input_tokens": "423895",
        "output_tokens": "760694",
        "mean_ttft": "449.13",
        "median_ttft": "211.95",
        "p99_ttft": "8503.75",
        "hit_ratios": [
            "0.0026790498303268444",
            "0.005857019810508183",
            "0.023337222870478416",
            "0.15778766687857598",
            "0.26656319720632454",
            "0.33978544776119396",
            "0.38466507331567723",
            "0.3922905027932961",
            "0.3907349017705554",
            "0.39489874391181745",
            "0.3996933103316082",
            "0.38990924805531546",
            "0.34843129960317465",
            "0.3371411483253589",
            "0.31869116987897816",
            "0.3005827170817111",
            "0.2894973968762516",
            "0.254724409448819",
            "0.24493182916325296",
            "0.23609649477859637",
            "0.2263361735089079",
            "0.2212702375548495",
            "0.2212702375548495",
            "0.2212702375548495",
            "0.2212702375548495",
            "0.2212702375548495"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.0025,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 0.25,
        "result_file": "sharegpt-reqrate+/client_logs/8000_lru.json"
    },
    {
        "num_requests": "2435",
        "input_tokens": "353179",
        "output_tokens": "745569",
        "mean_ttft": "287.54",
        "median_ttft": "169.83",
        "p99_ttft": "1795.75",
        "hit_ratios": [
            "0.006756756756756758",
            "0.01837088388214905",
            "0.04731756081306232",
            "0.18710385177961966",
            "0.28374964917204604",
            "0.33607613050944474",
            "0.3909927755767886",
            "0.4153094462540716",
            "0.4309931506849315",
            "0.4366453274745255",
            "0.4472259119239807",
            "0.4400385101389974",
            "0.43099300699300686",
            "0.42891647621026374",
            "0.41855160159439064",
            "0.40127050178180107",
            "0.38966518369989744",
            "0.3814301421503179",
            "0.35042064736917145",
            "0.33381419503750703",
            "0.31629541661317234",
            "0.3156613773557714",
            "0.3156613773557714",
            "0.3156613773557714",
            "0.3156613773557714"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.005,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 0.5,
        "result_file": "sharegpt-reqrate+/client_logs/8001_lru.json"
    },
    {
        "num_requests": "4155",
        "input_tokens": "467117",
        "output_tokens": "1254997",
        "mean_ttft": "231.42",
        "median_ttft": "184.23",
        "p99_ttft": "1235.17",
        "hit_ratios": [
            "0.07273023104458186",
            "0.07651467832604623",
            "0.0995366910775669",
            "0.12251701625225728",
            "0.21975604879024194",
            "0.2640557424315233",
            "0.28572406241445386",
            "0.31125331488527613",
            "0.3213283442469598",
            "0.32545095575697747",
            "0.3401881773790147",
            "0.367335962710649",
            "0.3764264807445655",
            "0.3920858933025123",
            "0.38520666356648514",
            "0.38569507274727954",
            "0.38292190148858596",
            "0.3802718565225929",
            "0.38362927314968476",
            "0.3766842979035559",
            "0.3723911528445146",
            "0.3723138876020099",
            "0.3753482864307607",
            "0.36622144226706965",
            "0.36152660824629945",
            "0.35817663296274266",
            "0.3573403942335981",
            "0.35450758912813274",
            "0.35332297410651664",
            "0.35424299965232275",
            "0.35765412145001163",
            "0.3554738873388317",
            "0.35622436005086017",
            "0.35977970509667323",
            "0.3635414395704008",
            "0.36935637197338256",
            "0.36582034820574033",
            "0.36443370381558526",
            "0.3643847793367477",
            "0.36416744892048974",
            "0.36412062206350326",
            "0.36412062206350326"
        ],
        "args": " --port 8003  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.02,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 2,
        "result_file": "sharegpt-reqrate++/client_logs/8003_ml.json"
    },
    {
        "num_requests": "3011",
        "input_tokens": "358288",
        "output_tokens": "912522",
        "mean_ttft": "251.31",
        "median_ttft": "189.35",
        "p99_ttft": "1542.96",
        "hit_ratios": [
            "0.036632498739707614",
            "0.05398832684824903",
            "0.06972361809045227",
            "0.1523128034755942",
            "0.2467023513668515",
            "0.3151972872996301",
            "0.34926400305868865",
            "0.3552446035361754",
            "0.3675808820046422",
            "0.37878541852723885",
            "0.38021883098186016",
            "0.4018525002387243",
            "0.41448979591836743",
            "0.42798673158204487",
            "0.43292383292383285",
            "0.43746571585298955",
            "0.4346464108758855",
            "0.4343056594365494",
            "0.430595002054195",
            "0.4352030947775629",
            "0.4371683123733556",
            "0.43245934284766013",
            "0.4235512245601932",
            "0.4177701896116154",
            "0.40326272858834356",
            "0.38738705053904166",
            "0.38389276560258045",
            "0.380142635358044",
            "0.37940048164776796",
            "0.37940048164776796",
            "0.37940048164776796"
        ],
        "args": " --port 8002  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-reqrate++/client_logs/8002_ml.json"
    },
    {
        "num_requests": "2516",
        "input_tokens": "425686",
        "output_tokens": "757799",
        "mean_ttft": "430.19",
        "median_ttft": "219.32",
        "p99_ttft": "9267.39",
        "hit_ratios": [
            "0.0026790498303268444",
            "0.005857019810508183",
            "0.023337222870478416",
            "0.18194532739987285",
            "0.286836744592104",
            "0.36240671641791045",
            "0.4151540598152574",
            "0.43344900929139135",
            "0.4328584716306848",
            "0.4293343587114415",
            "0.43105232892466927",
            "0.4292776214187774",
            "0.3880268139780273",
            "0.3810635305383486",
            "0.3646682922727653",
            "0.34260106091091996",
            "0.330638319109647",
            "0.2969816272965879",
            "0.2845329313737805",
            "0.276161906885299",
            "0.2646665244458235",
            "0.2587154225085259",
            "0.2587154225085259",
            "0.2587154225085259",
            "0.2587154225085259",
            "0.2587154225085259"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.0025,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 0.25,
        "result_file": "sharegpt-reqrate++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "2457",
        "input_tokens": "354753",
        "output_tokens": "748443",
        "mean_ttft": "322.92",
        "median_ttft": "175.24",
        "p99_ttft": "4017.40",
        "hit_ratios": [
            "0.006757958385203629",
            "0.01837088388214905",
            "0.04817469578263045",
            "0.20491400491400488",
            "0.32939094803501584",
            "0.3765705311250714",
            "0.42847181871005224",
            "0.44770194653020234",
            "0.4658663704716336",
            "0.4739668015275834",
            "0.4710560447812137",
            "0.466969087030973",
            "0.45963236115767125",
            "0.4627520174368821",
            "0.450718759749454",
            "0.43411264612114764",
            "0.42782623210783294",
            "0.4216638223582259",
            "0.39345547871961223",
            "0.3773722503943151",
            "0.35819241701594645",
            "0.3575761445629271",
            "0.3575761445629271",
            "0.3575761445629271",
            "0.3575761445629271"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.005,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 0.5,
        "result_file": "sharegpt-reqrate++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "2999",
        "input_tokens": "357072",
        "output_tokens": "909117",
        "mean_ttft": "242.69",
        "median_ttft": "172.97",
        "p99_ttft": "1516.10",
        "hit_ratios": [
            "0.0363147276395427",
            "0.05521373056994819",
            "0.06686642485412396",
            "0.143838229683327",
            "0.2137977484845569",
            "0.2729320388349515",
            "0.30704446040347333",
            "0.3245268357662209",
            "0.34785830739587975",
            "0.34364509412314626",
            "0.3592737682687962",
            "0.38098270545649554",
            "0.3953252967700378",
            "0.40291929824561407",
            "0.4049659302085485",
            "0.41195096792765135",
            "0.40675844806007505",
            "0.4022193079794209",
            "0.40284538329981767",
            "0.40189250970177015",
            "0.3965846325355133",
            "0.39361397023676736",
            "0.38141779605712456",
            "0.3735149783930271",
            "0.3578759296962646",
            "0.3452346484878792",
            "0.34151696349007493",
            "0.33840231237530044",
            "0.33777539506267384",
            "0.33777539506267384",
            "0.33777539506267384"
        ],
        "args": " --port 8002  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-reqrate++/client_logs/8002_lru.json"
    },
    {
        "num_requests": "4165",
        "input_tokens": "467383",
        "output_tokens": "1257400",
        "mean_ttft": "225.52",
        "median_ttft": "178.76",
        "p99_ttft": "1211.33",
        "hit_ratios": [
            "0.07262660804429247",
            "0.0759375",
            "0.08828370492293881",
            "0.0926312856943864",
            "0.1745565129244805",
            "0.22850142915475702",
            "0.25224144016943173",
            "0.26463028274254285",
            "0.2920960345292689",
            "0.30307256077720446",
            "0.32242158040856916",
            "0.34926566762584543",
            "0.35635481777504513",
            "0.3758625055390263",
            "0.370888952002272",
            "0.3769536837177852",
            "0.3597247374139804",
            "0.3572394198382329",
            "0.3610349813332181",
            "0.3583738400353511",
            "0.35226534123494535",
            "0.3446906432097389",
            "0.3443894269278379",
            "0.3378715211524245",
            "0.3304274282740224",
            "0.3300377924128142",
            "0.3289861559119039",
            "0.32714285714285707",
            "0.3243347860993233",
            "0.3250501448629373",
            "0.3311070741611455",
            "0.33154998080122877",
            "0.33134440614227517",
            "0.3311240428790199",
            "0.3353898394251348",
            "0.34013613384548924",
            "0.3378510282617719",
            "0.33295188273118625",
            "0.3333895269202402",
            "0.33400012502344184",
            "0.3345764296473276",
            "0.3345764296473276"
        ],
        "args": " --port 8003  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.02,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 2,
        "result_file": "sharegpt-reqrate++/client_logs/8003_lru.json"
    },
    {
        "num_requests": "2540",
        "input_tokens": "427941",
        "output_tokens": "765805",
        "mean_ttft": "473.55",
        "median_ttft": "214.81",
        "p99_ttft": "9295.95",
        "hit_ratios": [
            "0.002655807365439094",
            "0.005685733976567884",
            "0.02317825579456395",
            "0.1390659555093014",
            "0.22460485251182924",
            "0.29991922455573505",
            "0.34266160726385686",
            "0.35187580853816297",
            "0.35423684892459173",
            "0.3645758122743681",
            "0.37302329362982223",
            "0.3636121064267742",
            "0.32391325679521143",
            "0.313410710906453",
            "0.29680459431600636",
            "0.2790340706630485",
            "0.272154757792363",
            "0.2370603505708837",
            "0.22789303115148035",
            "0.2192547373775912",
            "0.2085310916257742",
            "0.2015887814163073",
            "0.2015848660827004",
            "0.2015848660827004",
            "0.2015848660827004",
            "0.2015848660827004"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.0025,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 0.25,
        "result_file": "sharegpt-reqrate++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "2456",
        "input_tokens": "354748",
        "output_tokens": "748229",
        "mean_ttft": "267.06",
        "median_ttft": "168.30",
        "p99_ttft": "1467.92",
        "hit_ratios": [
            "0.006402276364929753",
            "0.01785404749523314",
            "0.04666666666666667",
            "0.16813829125730628",
            "0.26128970531955603",
            "0.31385839534369697",
            "0.3668207248844563",
            "0.3965768940347344",
            "0.4105795726611555",
            "0.42101052126255156",
            "0.43174854918357786",
            "0.42535917034030013",
            "0.4172140363335109",
            "0.4165131560858927",
            "0.40766878980891724",
            "0.3936274969520774",
            "0.3816758544652702",
            "0.3727797144754317",
            "0.3418954494170741",
            "0.3257117278424352",
            "0.3080078683232738",
            "0.3078073285059056",
            "0.3078073285059056",
            "0.3078073285059056",
            "0.3078073285059056"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.005,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 0.5,
        "result_file": "sharegpt-reqrate++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "3018",
        "input_tokens": "358689",
        "output_tokens": "913183",
        "mean_ttft": "732.57",
        "median_ttft": "187.03",
        "p99_ttft": "9214.79",
        "hit_ratios": [
            "0.025931336742147554",
            "0.046029737424865554",
            "0.04699017199017198",
            "0.0980872976949485",
            "0.14010885885885888",
            "0.18261465793082432",
            "0.19431725522172744",
            "0.19704066425377903",
            "0.2051066610652103",
            "0.20933680625125228",
            "0.2145691609977325",
            "0.2188827694728561",
            "0.22458217270194994",
            "0.2431003798443436",
            "0.2527362454803089",
            "0.257619425848179",
            "0.2565369149435612",
            "0.25992105112607033",
            "0.2588460991899957",
            "0.25533907517350946",
            "0.2563283047813858",
            "0.24692624496507606",
            "0.23694389335312496",
            "0.23491262835525129",
            "0.22534601508691376",
            "0.21879586981829224",
            "0.2135042276858598",
            "0.2113663466518906",
            "0.2110045431600202",
            "0.2110045431600202",
            "0.2110045431600202"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 5750 ",
        "size": 5750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "3007",
        "input_tokens": "358189",
        "output_tokens": "911554",
        "mean_ttft": "3023.12",
        "median_ttft": "192.40",
        "p99_ttft": "21627.21",
        "hit_ratios": [
            "0.027013251783893986",
            "0.04838467317806161",
            "0.05396685731045608",
            "0.06130408287629494",
            "0.09202397418165052",
            "0.11421072365954255",
            "0.11469095799963318",
            "0.11411808235107562",
            "0.11918253599628424",
            "0.11897067624177138",
            "0.1191377497371188",
            "0.12487490617963472",
            "0.12699099722991686",
            "0.13940525333263215",
            "0.14327115094247722",
            "0.1476981233967868",
            "0.1495306213679034",
            "0.15024930537053247",
            "0.15183869248534373",
            "0.15137299579472915",
            "0.1499192348905273",
            "0.14354807215705123",
            "0.13733363928407527",
            "0.13537608318890815",
            "0.13100765964202088",
            "0.12692960888190413",
            "0.12529637956240255",
            "0.12522760433623947",
            "0.12404550598606236",
            "0.12404550598606236",
            "0.12404550598606236"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 3750 ",
        "size": 3750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "3022",
        "input_tokens": "358774",
        "output_tokens": "914288",
        "mean_ttft": "666.49",
        "median_ttft": "184.33",
        "p99_ttft": "8407.53",
        "hit_ratios": [
            "0.02983445515735856",
            "0.04997635188396659",
            "0.05081891933261901",
            "0.10125801677355697",
            "0.1427367237988199",
            "0.18468091579828094",
            "0.19475068905036327",
            "0.1973523313307459",
            "0.20616489460921467",
            "0.2099615631005765",
            "0.21515944283391072",
            "0.21872444807849548",
            "0.22444541104828186",
            "0.24338020695144602",
            "0.25260664664371346",
            "0.2574740280361112",
            "0.2564065943034359",
            "0.25979794128860084",
            "0.25873182165243186",
            "0.2552327136552094",
            "0.2562263367254023",
            "0.2476171804307174",
            "0.23777701622115618",
            "0.235546750529918",
            "0.22629785002621933",
            "0.21894771473401842",
            "0.21448590159140216",
            "0.21235963178948397",
            "0.2117774176121017",
            "0.2117774176121017",
            "0.2117774176121017"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 5750 ",
        "size": 5750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "3018",
        "input_tokens": "358722",
        "output_tokens": "914316",
        "mean_ttft": "3391.12",
        "median_ttft": "197.97",
        "p99_ttft": "24038.45",
        "hit_ratios": [
            "0.026826775677056717",
            "0.04607946819761293",
            "0.0517470145953118",
            "0.058024237972824085",
            "0.0856693496160607",
            "0.10910594781562523",
            "0.11040990135408367",
            "0.11041677699518085",
            "0.1183429207645203",
            "0.11606536417755402",
            "0.11648066259563414",
            "0.12326236693800874",
            "0.12524552281917964",
            "0.13842915405867648",
            "0.14451499890518937",
            "0.148705396240821",
            "0.15113043124987305",
            "0.15129165320204538",
            "0.15273417407190623",
            "0.15212183149323996",
            "0.1504272139263755",
            "0.1440789868555309",
            "0.1378033260406389",
            "0.1360769124360216",
            "0.13119852408249325",
            "0.12848344103392567",
            "0.12588936920608873",
            "0.12543390787340097",
            "0.12434392142459387",
            "0.12434392142459387",
            "0.12434392142459387"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 3750 ",
        "size": 3750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "3012",
        "input_tokens": "358308",
        "output_tokens": "912820",
        "mean_ttft": "535.96",
        "median_ttft": "189.88",
        "p99_ttft": "6737.25",
        "hit_ratios": [
            "0.021903052064631955",
            "0.042188739095955594",
            "0.0422339108910891",
            "0.06210869020786376",
            "0.092121677382209",
            "0.13002197112366604",
            "0.14512961508248234",
            "0.1497376939390557",
            "0.15135962098405958",
            "0.15528499810422547",
            "0.1599298978298158",
            "0.16001329566229017",
            "0.17005409700785476",
            "0.18522131787267254",
            "0.19172102100559807",
            "0.19281577561862825",
            "0.18871274843292046",
            "0.18638596491228074",
            "0.1847047218448138",
            "0.18311195445920303",
            "0.18145397857753487",
            "0.17662699417574065",
            "0.168717733221275",
            "0.16464463822217032",
            "0.15673004324250117",
            "0.15217563291139233",
            "0.1508148526874161",
            "0.14925599373468404",
            "0.14906840128079063",
            "0.14906840128079063",
            "0.14906840128079063"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 6000 ",
        "size": 6000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "3001",
        "input_tokens": "358013",
        "output_tokens": "909684",
        "mean_ttft": "2343.50",
        "median_ttft": "193.39",
        "p99_ttft": "19123.54",
        "hit_ratios": [
            "0.012826837691169215",
            "0.03503380454824831",
            "0.04098115465151062",
            "0.044408508520960316",
            "0.061861467803917894",
            "0.06826200337475072",
            "0.07258834765998087",
            "0.0723303379458625",
            "0.0704449920278301",
            "0.07517122568175132",
            "0.07447754557581146",
            "0.07216323822163236",
            "0.0706938127651781",
            "0.07860286335023117",
            "0.08531547481589818",
            "0.08890418763650174",
            "0.084637482313596",
            "0.08378090237965923",
            "0.07965380940784172",
            "0.07724215840290892",
            "0.075699164722194",
            "0.07321876687525805",
            "0.0699786889953599",
            "0.06844998167827039",
            "0.06513314164270531",
            "0.06467601384567725",
            "0.06317698885721686",
            "0.0631291070004178",
            "0.06290312441063681",
            "0.06290312441063681",
            "0.06290312441063681"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 4000 ",
        "size": 4000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "3023",
        "input_tokens": "358839",
        "output_tokens": "914626",
        "mean_ttft": "499.37",
        "median_ttft": "182.18",
        "p99_ttft": "6463.34",
        "hit_ratios": [
            "0.022003577817531306",
            "0.04235406091370558",
            "0.04238861386138613",
            "0.05975197294250282",
            "0.09095224532421912",
            "0.13099759708549724",
            "0.14422146221849388",
            "0.14722784740846148",
            "0.14892277898813847",
            "0.15275110628705016",
            "0.15626273478309188",
            "0.1586086267779941",
            "0.16976955730745905",
            "0.18615150256197197",
            "0.19304232669485047",
            "0.19420823885109598",
            "0.1891114425740464",
            "0.18727431451132892",
            "0.18545582359035073",
            "0.1835275238959045",
            "0.1816391582249962",
            "0.17732470778039633",
            "0.16990218659328166",
            "0.16561202867841276",
            "0.1579842303736715",
            "0.15371043345446883",
            "0.1518295318737763",
            "0.1505129980487191",
            "0.14987853439855744",
            "0.14987853439855744",
            "0.14987853439855744"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 6000 ",
        "size": 6000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "3009",
        "input_tokens": "358165",
        "output_tokens": "911719",
        "mean_ttft": "2477.27",
        "median_ttft": "188.22",
        "p99_ttft": "19688.09",
        "hit_ratios": [
            "0.012738853503184714",
            "0.034728541097967844",
            "0.04061438487667996",
            "0.04397494165335954",
            "0.06288315065948356",
            "0.07230018303843809",
            "0.07623630722471983",
            "0.07370266863937752",
            "0.07163117157828951",
            "0.07473916115891427",
            "0.07358338226658838",
            "0.0712012337172294",
            "0.0687550977252817",
            "0.07663901672775376",
            "0.08363886342804767",
            "0.08625813756014718",
            "0.08219936540386294",
            "0.08140649335090454",
            "0.07679985098258359",
            "0.074808003945607",
            "0.07324180914680366",
            "0.07144104803493448",
            "0.06848089751364461",
            "0.06676725211302677",
            "0.06350749066270496",
            "0.0620611400347083",
            "0.06117406602504396",
            "0.061235350015837804",
            "0.06081597374453531",
            "0.06081597374453531",
            "0.06081597374453531"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 4000 ",
        "size": 4000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "3015",
        "input_tokens": "358688",
        "output_tokens": "912644",
        "mean_ttft": "242.44",
        "median_ttft": "178.37",
        "p99_ttft": "1504.56",
        "hit_ratios": [
            "0.03665097511768661",
            "0.05566343042071197",
            "0.06899810964083175",
            "0.14840499306518726",
            "0.22078045987978248",
            "0.2685498768472906",
            "0.2973675864256264",
            "0.30114092881246984",
            "0.3041500852757249",
            "0.3080353523068191",
            "0.3127728085867621",
            "0.32277277911544805",
            "0.3337616822429907",
            "0.3501011930123563",
            "0.3566874294962971",
            "0.3610270184144039",
            "0.35842352460690224",
            "0.3568110123315172",
            "0.35140658598567664",
            "0.3552404418296711",
            "0.35924675615570467",
            "0.35392196876936804",
            "0.3431337499463743",
            "0.33978050032605844",
            "0.32723334427305556",
            "0.3143840656531011",
            "0.3107337039525933",
            "0.30829517649053945",
            "0.30704598878910244",
            "0.30704598878910244",
            "0.30704598878910244"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 7750 ",
        "size": 7750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "3021",
        "input_tokens": "358756",
        "output_tokens": "914135",
        "mean_ttft": "239.17",
        "median_ttft": "172.29",
        "p99_ttft": "1487.41",
        "hit_ratios": [
            "0.03663865546218487",
            "0.05566343042071197",
            "0.06899810964083175",
            "0.16151809355692853",
            "0.24942813572245523",
            "0.3166460968836779",
            "0.3538247037201344",
            "0.35805379916407676",
            "0.3782868432193423",
            "0.38788269936670566",
            "0.3905374040349939",
            "0.40639817917430615",
            "0.41939238738214424",
            "0.4313323572474379",
            "0.4406949712467882",
            "0.4423347398030943",
            "0.4377185627517946",
            "0.4361917108323485",
            "0.4340028057464529",
            "0.43827666371193",
            "0.44000639590661983",
            "0.4354424257081532",
            "0.42638593283528786",
            "0.4213185322573948",
            "0.40668825572588857",
            "0.3931818747975986",
            "0.3871223004066129",
            "0.3839731077857297",
            "0.382272896210241",
            "0.382272896210241",
            "0.382272896210241"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "3026",
        "input_tokens": "359255",
        "output_tokens": "915266",
        "mean_ttft": "242.35",
        "median_ttft": "178.42",
        "p99_ttft": "1514.62",
        "hit_ratios": [
            "0.03617701497560155",
            "0.05566343042071197",
            "0.06899810964083175",
            "0.14722222222222225",
            "0.22068504913653278",
            "0.26918345379055825",
            "0.2978008745801382",
            "0.2977868281442581",
            "0.3029775624441415",
            "0.3058771328304628",
            "0.31236635780470434",
            "0.3218056521464248",
            "0.33331393318589236",
            "0.3454909819639281",
            "0.35661926403753136",
            "0.3609636586361782",
            "0.3571194896540445",
            "0.35676974110649345",
            "0.35205014827837283",
            "0.35532103493836886",
            "0.35958521075000816",
            "0.3526104174854139",
            "0.34337246165709906",
            "0.33956015021964797",
            "0.3284623744615105",
            "0.31585581987469125",
            "0.3111216706874286",
            "0.30847686755422526",
            "0.306655958959115",
            "0.306655958959115",
            "0.306655958959115"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 7750 ",
        "size": 7750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "3022",
        "input_tokens": "358806",
        "output_tokens": "915186",
        "mean_ttft": "235.73",
        "median_ttft": "173.35",
        "p99_ttft": "1502.71",
        "hit_ratios": [
            "0.036644814254496554",
            "0.05566343042071197",
            "0.06899810964083175",
            "0.16151809355692853",
            "0.24968991508443855",
            "0.3166088631984586",
            "0.35041048813084713",
            "0.3552914605291461",
            "0.37177972110612145",
            "0.38234698424271873",
            "0.38572142143570715",
            "0.4045282779206757",
            "0.4187749861390761",
            "0.4325941289087428",
            "0.43892212632404864",
            "0.44131637042263144",
            "0.4376225089839923",
            "0.4351665997591331",
            "0.43221920144997084",
            "0.4374612432332781",
            "0.43923275048393046",
            "0.4359346423011231",
            "0.42565422565422567",
            "0.42134051532652167",
            "0.406632105359621",
            "0.3921109060988382",
            "0.38655421157343567",
            "0.3836660266396167",
            "0.3814546807310606",
            "0.3814546807310606",
            "0.3814546807310606"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "3017",
        "input_tokens": "358641",
        "output_tokens": "913639",
        "mean_ttft": "239.02",
        "median_ttft": "174.66",
        "p99_ttft": "1497.61",
        "hit_ratios": [
            "0.035828427249789734",
            "0.05165155440414508",
            "0.0514520202020202",
            "0.09895833333333334",
            "0.16484895280378342",
            "0.2143642935722144",
            "0.23761988647484827",
            "0.24549574444567254",
            "0.2525709786940904",
            "0.2570069859439441",
            "0.2590078328981723",
            "0.27075249560574394",
            "0.2850949502350858",
            "0.2993676704086465",
            "0.30350553505535055",
            "0.3092911579903003",
            "0.3112882147524478",
            "0.30387149752648773",
            "0.29811482114969895",
            "0.29926597127102883",
            "0.29586454798938433",
            "0.2935388807909247",
            "0.2810430091413158",
            "0.2755382002409744",
            "0.26460476373837954",
            "0.25478164371042505",
            "0.2523596367821974",
            "0.2499715135785277",
            "0.24875991439002906",
            "0.24875991439002906",
            "0.24875991439002906"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 8000 ",
        "size": 8000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "3021",
        "input_tokens": "358787",
        "output_tokens": "914101",
        "mean_ttft": "235.88",
        "median_ttft": "172.91",
        "p99_ttft": "1499.32",
        "hit_ratios": [
            "0.03632083403396671",
            "0.05521373056994819",
            "0.06691919191919192",
            "0.14033303673573155",
            "0.2083212385099178",
            "0.26584963469243467",
            "0.30638074627844447",
            "0.3223190981285055",
            "0.34281776114994583",
            "0.33917708685366676",
            "0.3510729935208419",
            "0.3762633843690583",
            "0.3923020212569884",
            "0.4026736315892942",
            "0.4044880207931238",
            "0.4082988742022611",
            "0.40583310135120665",
            "0.3999278325715659",
            "0.40028772139600916",
            "0.4008974133380256",
            "0.3984089877058139",
            "0.3914658250446313",
            "0.3815598986608757",
            "0.3742313408912072",
            "0.3582297131683671",
            "0.3455389578879721",
            "0.3403871033855533",
            "0.33704375166398304",
            "0.3353420236504373",
            "0.3353420236504373",
            "0.3353420236504373"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "3030",
        "input_tokens": "359317",
        "output_tokens": "916226",
        "mean_ttft": "240.62",
        "median_ttft": "178.20",
        "p99_ttft": "1516.85",
        "hit_ratios": [
            "0.03585858585858586",
            "0.05165155440414508",
            "0.051443900899479256",
            "0.10231733569710016",
            "0.16316655375979872",
            "0.21092102179517228",
            "0.23367764568310273",
            "0.24120105587329518",
            "0.2546444898356191",
            "0.255063264709567",
            "0.25474947228085765",
            "0.2654893449092344",
            "0.2803684513529073",
            "0.29588646988851697",
            "0.3015045852811199",
            "0.30694078869365204",
            "0.3081696409466342",
            "0.302717152775007",
            "0.298996469057796",
            "0.29983505299361274",
            "0.29692059977860524",
            "0.29242508544630796",
            "0.28198347107438027",
            "0.27622861303239904",
            "0.26566547258197853",
            "0.2561065293901349",
            "0.2522826670758842",
            "0.24972807527888086",
            "0.24819488918189228",
            "0.24819488918189228",
            "0.24819488918189228"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 8000 ",
        "size": 8000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "3025",
        "input_tokens": "359283",
        "output_tokens": "915346",
        "mean_ttft": "236.24",
        "median_ttft": "170.53",
        "p99_ttft": "1498.47",
        "hit_ratios": [
            "0.03632694248234107",
            "0.05521373056994819",
            "0.06692975532754539",
            "0.14349149961938598",
            "0.20971472629144178",
            "0.26683958185962425",
            "0.3051456183884027",
            "0.32082779991146515",
            "0.34307285027943907",
            "0.3392053815429891",
            "0.35179250204963836",
            "0.37381530378105143",
            "0.38955123502078737",
            "0.3999443981095357",
            "0.4027930813581037",
            "0.4078887857363897",
            "0.4054833746474058",
            "0.4003440550488078",
            "0.40244129358788283",
            "0.4017085021663245",
            "0.39934988773834645",
            "0.3928334019182677",
            "0.38200612097935654",
            "0.37490927038875815",
            "0.3589219865933734",
            "0.3462276089707627",
            "0.3412049729040484",
            "0.3377396569122098",
            "0.3357184030475425",
            "0.3357184030475425",
            "0.3357184030475425"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "3035",
        "input_tokens": "359939",
        "output_tokens": "917570",
        "mean_ttft": "2810.84",
        "median_ttft": "177.66",
        "p99_ttft": "19501.59",
        "hit_ratios": [
            "0.014138509465612268",
            "0.0466374269005848",
            "0.052061046926258736",
            "0.08105538388400285",
            "0.12331596910364648",
            "0.1590792463895609",
            "0.16489329360977684",
            "0.17139399042256476",
            "0.16784145001830827",
            "0.1816235079509854",
            "0.1767822060061745",
            "0.1878532396565183",
            "0.19376073268460212",
            "0.191339826270071",
            "0.1929636487671767",
            "0.1961493529834651",
            "0.19477834309691278",
            "0.19020596889449343",
            "0.19259022676461188",
            "0.19362847892096824",
            "0.19017814155031287",
            "0.18519352610875892",
            "0.17630594350669745",
            "0.172985221948812",
            "0.16584538759073797",
            "0.16172903782905168",
            "0.16034831667382096",
            "0.1590436841596597",
            "0.15726732485735245",
            "0.156732969962955",
            "0.156732969962955"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 3750 ",
        "size": 3750,
        "num_prompts": 30000,
        "use_oracle": 3,
        "use_token_id": 1,
        "algorithm": "ml-true",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_ml-true.json"
    },
    {
        "num_requests": "3046",
        "input_tokens": "360151",
        "output_tokens": "919135",
        "mean_ttft": "448.33",
        "median_ttft": "160.00",
        "p99_ttft": "5173.30",
        "hit_ratios": [
            "0.022840302081414625",
            "0.04420852479797179",
            "0.04429012345679012",
            "0.12879439596903036",
            "0.2059487951807229",
            "0.2519853390348198",
            "0.27810948400477653",
            "0.29411450259261235",
            "0.31059791501098605",
            "0.3052200778397465",
            "0.30618047410882476",
            "0.32419243120710284",
            "0.33953880111524165",
            "0.34935324709961335",
            "0.3507207937326555",
            "0.34940225435500405",
            "0.3441802508477347",
            "0.3406551354660952",
            "0.33871456317599474",
            "0.3332269122193844",
            "0.32971601945643975",
            "0.32266095854017707",
            "0.3118945256520492",
            "0.30804012410089454",
            "0.2969821133086438",
            "0.28854820741340886",
            "0.2819326493544745",
            "0.2781750208703858",
            "0.2753191794577536",
            "0.2753191794577536",
            "0.2753191794577536"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 5750 ",
        "size": 5750,
        "num_prompts": 30000,
        "use_oracle": 3,
        "use_token_id": 1,
        "algorithm": "ml-true",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_ml-true.json"
    },
    {
        "num_requests": "3051",
        "input_tokens": "360304",
        "output_tokens": "920664",
        "mean_ttft": "217.90",
        "median_ttft": "151.03",
        "p99_ttft": "1463.91",
        "hit_ratios": [
            "0.036884542803225256",
            "0.05569046462684151",
            "0.06880733944954129",
            "0.1981261711430356",
            "0.3171940526115135",
            "0.3962786406274027",
            "0.4332340452500158",
            "0.4552274797706446",
            "0.4702949339103437",
            "0.46960590536888375",
            "0.4621875667592394",
            "0.46905054709425137",
            "0.48338552540013907",
            "0.4882803125249991",
            "0.49135868769223234",
            "0.4875465021322927",
            "0.4783070946636679",
            "0.46793625376491654",
            "0.46291396608363655",
            "0.4686867334816871",
            "0.46519690071091935",
            "0.4590888451642197",
            "0.4449285091916752",
            "0.4406338301290929",
            "0.4269321058084482",
            "0.41299737743591025",
            "0.40598489677830624",
            "0.4019641125121241",
            "0.3952758153143508",
            "0.3952758153143508",
            "0.3952758153143508"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 7750 ",
        "size": 7750,
        "num_prompts": 30000,
        "use_oracle": 3,
        "use_token_id": 1,
        "algorithm": "ml-true",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_ml-true.json"
    },
    {
        "num_requests": "3052",
        "input_tokens": "360293",
        "output_tokens": "921229",
        "mean_ttft": "213.41",
        "median_ttft": "141.55",
        "p99_ttft": "1508.11",
        "hit_ratios": [
            "0.03617701497560155",
            "0.05567243890597183",
            "0.06919431279620852",
            "0.19812617114303557",
            "0.3171940526115135",
            "0.40304474857757955",
            "0.4593446986501045",
            "0.4949630264709034",
            "0.5256126816877555",
            "0.5378564801742566",
            "0.5420460632029993",
            "0.5539293165581335",
            "0.5663485042486321",
            "0.5776490375630722",
            "0.584149446675154",
            "0.585111956447461",
            "0.5734777278299957",
            "0.5665997130559537",
            "0.5668780731133753",
            "0.564437960121413",
            "0.5589630199320641",
            "0.55311310886406",
            "0.543665683269842",
            "0.5401323180626636",
            "0.527878596601967",
            "0.5139518813995853",
            "0.5062077095946258",
            "0.5008371551284849",
            "0.491930883681133",
            "0.491930883681133",
            "0.491930883681133"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 3,
        "use_token_id": 1,
        "algorithm": "ml-true",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_ml-true.json"
    }
]