[
    {
        "num_requests": "3013",
        "input_tokens": "358639",
        "output_tokens": "912570",
        "mean_ttft": "734.46",
        "median_ttft": "184.46",
        "p99_ttft": "9490.24",
        "hit_ratios": [
            "0.02777777777777778",
            "0.04695652173913044",
            "0.047889485801995396",
            "0.09866405196715282",
            "0.14166432123088468",
            "0.18402010815751388",
            "0.19540950708641663",
            "0.1984846867997012",
            "0.20689816111266687",
            "0.2109944707107941",
            "0.21653027243419418",
            "0.220020756675158",
            "0.22575216874111467",
            "0.24416998671978746",
            "0.253719311102968",
            "0.2585095761096487",
            "0.25815920905106515",
            "0.26067887109077037",
            "0.2595427982735038",
            "0.25599518378541075",
            "0.2570510874254941",
            "0.24842359330215716",
            "0.23837458251263163",
            "0.23571319666791404",
            "0.2265670076055599",
            "0.2195313390133053",
            "0.2141010633108965",
            "0.21193633952254642",
            "0.21164097565671514",
            "0.21164097565671514",
            "0.21164097565671514"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 5750 ",
        "size": 5750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "3001",
        "input_tokens": "358075",
        "output_tokens": "910634",
        "mean_ttft": "3480.03",
        "median_ttft": "201.97",
        "p99_ttft": "25377.07",
        "hit_ratios": [
            "0.023378582202111614",
            "0.05526973394090842",
            "0.06050179211469534",
            "0.06751256882930334",
            "0.0941622989336707",
            "0.11378169790518192",
            "0.11071842057156783",
            "0.10913692202246006",
            "0.1157161195672107",
            "0.11562760758135653",
            "0.11688857743517869",
            "0.12346026386544112",
            "0.12592253561416558",
            "0.13647571083831705",
            "0.14019031016198152",
            "0.1447769216986203",
            "0.14820734865652313",
            "0.14796442011631886",
            "0.1491373824506823",
            "0.14941895411741132",
            "0.14787359810844491",
            "0.14002448711440263",
            "0.13346181642977603",
            "0.1329736459846442",
            "0.12782577819860344",
            "0.12380880255468467",
            "0.1231108119684269",
            "0.12152886115444621",
            "0.12057748017286417",
            "0.12057748017286417",
            "0.12057748017286417"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 3750 ",
        "size": 3750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "3013",
        "input_tokens": "358671",
        "output_tokens": "913450",
        "mean_ttft": "441.36",
        "median_ttft": "181.90",
        "p99_ttft": "5646.13",
        "hit_ratios": [
            "0.02204301075268817",
            "0.04323040380047506",
            "0.043236565781346506",
            "0.06276516096830546",
            "0.09228860469555257",
            "0.12862972845707107",
            "0.14046626725709818",
            "0.14558684663667165",
            "0.1481682362802623",
            "0.15423412732050518",
            "0.1581878386514148",
            "0.159755565255347",
            "0.17219033512312534",
            "0.1900803235409762",
            "0.1977009113504556",
            "0.1971180446967692",
            "0.19307934590326617",
            "0.19011629078743172",
            "0.1879306470940683",
            "0.1851792969440028",
            "0.1823387328344847",
            "0.17729420780381885",
            "0.16906474820143885",
            "0.16475281211961224",
            "0.15683807364185665",
            "0.15184722185280733",
            "0.15019167931664387",
            "0.14887980334466897",
            "0.1484441399956869",
            "0.1484441399956869",
            "0.1484441399956869"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 6000 ",
        "size": 6000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "2998",
        "input_tokens": "357007",
        "output_tokens": "909594",
        "mean_ttft": "2626.97",
        "median_ttft": "195.11",
        "p99_ttft": "20442.15",
        "hit_ratios": [
            "0.012852199703410774",
            "0.03512014787430684",
            "0.0411041104110411",
            "0.04439194230290972",
            "0.06312634635197154",
            "0.06675332619666616",
            "0.07216363867361199",
            "0.07123212321232122",
            "0.07083152147654248",
            "0.07442836165303122",
            "0.0734305973196718",
            "0.07106565270813267",
            "0.06873335985555588",
            "0.07605453176837937",
            "0.08340633857253284",
            "0.0867957830463197",
            "0.0816453925135071",
            "0.08173744940494171",
            "0.07755140362407285",
            "0.07514000141773587",
            "0.07372278874051953",
            "0.07141945976974837",
            "0.06833598907352605",
            "0.06680872951723121",
            "0.06362355828905342",
            "0.06157476936279766",
            "0.06071990328493243",
            "0.06085715014149859",
            "0.06096017015673662",
            "0.06096017015673662"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 4000 ",
        "size": 4000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "3018",
        "input_tokens": "358689",
        "output_tokens": "913724",
        "mean_ttft": "234.99",
        "median_ttft": "174.92",
        "p99_ttft": "1479.38",
        "hit_ratios": [
            "0.036644814254496554",
            "0.05566343042071197",
            "0.06899810964083175",
            "0.16151809355692853",
            "0.24968991508443855",
            "0.3182377364293404",
            "0.3538247037201344",
            "0.3581265741385778",
            "0.37527635354438127",
            "0.38497841958775364",
            "0.3877521871094448",
            "0.4058291711449706",
            "0.4188976836223956",
            "0.43034971745388634",
            "0.4396471680594243",
            "0.4419944648609409",
            "0.4374118080124338",
            "0.4357151027567011",
            "0.43355885852289877",
            "0.43763500276284734",
            "0.4401641831568524",
            "0.4352733206418275",
            "0.4262297422717212",
            "0.4211691456243513",
            "0.4065004568594177",
            "0.39282820854781825",
            "0.386469607138944",
            "0.3833409644070656",
            "0.38152027998849364",
            "0.38152027998849364",
            "0.38152027998849364"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "3022",
        "input_tokens": "358793",
        "output_tokens": "915029",
        "mean_ttft": "244.47",
        "median_ttft": "182.37",
        "p99_ttft": "1500.92",
        "hit_ratios": [
            "0.036644814254496554",
            "0.05566343042071197",
            "0.06975648075412412",
            "0.1419658772599949",
            "0.21840948193462056",
            "0.2695879057631801",
            "0.2932541961835471",
            "0.2960051685151287",
            "0.29786832673080554",
            "0.3033612080863846",
            "0.30691260744985666",
            "0.3201194333269805",
            "0.33332361516034986",
            "0.34850997806430895",
            "0.3532533909966581",
            "0.36020347371797795",
            "0.3574587445231562",
            "0.3564008525509322",
            "0.35130307414750905",
            "0.3547556975864099",
            "0.35830304589752654",
            "0.3525621634702643",
            "0.3424025526043464",
            "0.33753019239845633",
            "0.3259880710493543",
            "0.31390587941580317",
            "0.31060940334362885",
            "0.3074852695133482",
            "0.3058812188979792",
            "0.3058812188979792",
            "0.3058812188979792"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 7750 ",
        "size": 7750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "3020",
        "input_tokens": "358726",
        "output_tokens": "913591",
        "mean_ttft": "238.09",
        "median_ttft": "177.01",
        "p99_ttft": "1513.18",
        "hit_ratios": [
            "0.035828427249789734",
            "0.05165155440414508",
            "0.051476393494394444",
            "0.10549589387239418",
            "0.1688923047362859",
            "0.21264951919318267",
            "0.2355731739017416",
            "0.24445062586926286",
            "0.2576947779259918",
            "0.2598187311178248",
            "0.2595402559166573",
            "0.26965234348732436",
            "0.284225177853387",
            "0.2997826639193881",
            "0.3056635058811337",
            "0.3109433599384556",
            "0.3110711422194292",
            "0.3037220943845626",
            "0.300110721189033",
            "0.30072412575061813",
            "0.296886093924333",
            "0.2929473852550775",
            "0.28175376573146593",
            "0.27601604591239154",
            "0.2649157746245124",
            "0.2562032529977441",
            "0.25283140283140265",
            "0.2506374623897188",
            "0.24939172749391708",
            "0.24939172749391708",
            "0.24939172749391708"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 8000 ",
        "size": 8000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "3023",
        "input_tokens": "358866",
        "output_tokens": "915146",
        "mean_ttft": "239.03",
        "median_ttft": "174.99",
        "p99_ttft": "1507.92",
        "hit_ratios": [
            "0.03632083403396671",
            "0.05521373056994819",
            "0.06686642485412396",
            "0.14107936507936508",
            "0.21376565382001747",
            "0.2696788413098237",
            "0.3049603174603176",
            "0.32330151600224605",
            "0.34727534648055247",
            "0.34172615739751216",
            "0.35576959395656294",
            "0.3770945011968579",
            "0.3921623382667785",
            "0.4011660817389337",
            "0.4029061743183772",
            "0.4110604195331547",
            "0.4062168309325246",
            "0.4023987520006483",
            "0.40333872849776037",
            "0.4034885576019712",
            "0.39833071451501173",
            "0.3931675827687587",
            "0.3810591371788656",
            "0.37297494704550427",
            "0.3572613190336667",
            "0.34523402352074495",
            "0.34092724789320406",
            "0.33734755514776144",
            "0.33543109670393667",
            "0.33543109670393667",
            "0.33543109670393667"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "3016",
        "input_tokens": "358660",
        "output_tokens": "912749",
        "mean_ttft": "738.24",
        "median_ttft": "185.17",
        "p99_ttft": "9487.82",
        "hit_ratios": [
            "0.025907681080094877",
            "0.045361150624308524",
            "0.046340340647537205",
            "0.09737134394668641",
            "0.14088734640277645",
            "0.1832305231893991",
            "0.19306496112365182",
            "0.1959772255627095",
            "0.20463879036774307",
            "0.20857371794871787",
            "0.21424775939636545",
            "0.21729280724938643",
            "0.22327308596129855",
            "0.24189950069053434",
            "0.25163055426631165",
            "0.2565690946221919",
            "0.2555922932484284",
            "0.25903821218823886",
            "0.2580238361663203",
            "0.25456521739130433",
            "0.25510041186424437",
            "0.24668134918240514",
            "0.23671290746132329",
            "0.2346844037968544",
            "0.22545959980068708",
            "0.21896193946755746",
            "0.2137383188956712",
            "0.21158201619121053",
            "0.21121461626299662",
            "0.21121461626299662",
            "0.21121461626299662"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 5750 ",
        "size": 5750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "3011",
        "input_tokens": "358302",
        "output_tokens": "912578",
        "mean_ttft": "3205.33",
        "median_ttft": "194.26",
        "p99_ttft": "22621.35",
        "hit_ratios": [
            "0.0151709951144253",
            "0.03936284270179201",
            "0.045271178843567905",
            "0.05285307587572719",
            "0.08570636094674555",
            "0.10644257703081234",
            "0.10806481424434725",
            "0.10839142233810464",
            "0.11618623218678922",
            "0.11483964195399991",
            "0.11692015209125474",
            "0.12430141287284142",
            "0.1262670141905589",
            "0.13941711723592246",
            "0.14402439024390243",
            "0.148377647589004",
            "0.15049235026041666",
            "0.15090742717706265",
            "0.15237959735363163",
            "0.15158386240720215",
            "0.14994236680327871",
            "0.14360910170995447",
            "0.13734102718686306",
            "0.13562592844548726",
            "0.1306292635940201",
            "0.12636383175088817",
            "0.12475958299133887",
            "0.12428489014951206",
            "0.12303127410836155",
            "0.12303127410836155",
            "0.12303127410836155"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 3750 ",
        "size": 3750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "3015",
        "input_tokens": "358655",
        "output_tokens": "912447",
        "mean_ttft": "656.86",
        "median_ttft": "186.26",
        "p99_ttft": "7793.36",
        "hit_ratios": [
            "0.026474347270403504",
            "0.04585705249841873",
            "0.04555913483663138",
            "0.09120318526813487",
            "0.13914430474760744",
            "0.18182510664229132",
            "0.1931640012543117",
            "0.19604076623445926",
            "0.2045740956826138",
            "0.20883920342989948",
            "0.2143488873951959",
            "0.2182879743855354",
            "0.22306040735797603",
            "0.24212258766690564",
            "0.2514535593882836",
            "0.2564277123471078",
            "0.25626860194887263",
            "0.2589103529815595",
            "0.25789548474190904",
            "0.2549045887852033",
            "0.25651276966624553",
            "0.24819812332844773",
            "0.23816398879295553",
            "0.2355381615521843",
            "0.22636290946270102",
            "0.21940351410197984",
            "0.21425696688822485",
            "0.21239344103938754",
            "0.21178140866761305",
            "0.21178140866761305",
            "0.21178140866761305"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 5750 ",
        "size": 5750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size+++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "3005",
        "input_tokens": "358128",
        "output_tokens": "910881",
        "mean_ttft": "3446.31",
        "median_ttft": "202.16",
        "p99_ttft": "24796.31",
        "hit_ratios": [
            "0.022278481012658224",
            "0.0529585798816568",
            "0.058280438545874204",
            "0.06569606545542053",
            "0.09289667059784089",
            "0.11436366317652263",
            "0.11119257086999024",
            "0.10954343690551681",
            "0.11610383643464278",
            "0.11519384151422563",
            "0.11692458855318105",
            "0.12318817894374354",
            "0.12561936130602894",
            "0.13631469761823486",
            "0.13993405740884415",
            "0.14449495062585377",
            "0.14816912805988272",
            "0.14806642445454724",
            "0.1492331369739426",
            "0.1496432688933817",
            "0.14808716087672463",
            "0.14039523090041445",
            "0.13422551252847387",
            "0.13317831388669746",
            "0.12861587954539463",
            "0.12656744256386346",
            "0.12574974398985714",
            "0.12498948810052983",
            "0.12414267745686693",
            "0.12414267745686693",
            "0.12414267745686693"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 3750 ",
        "size": 3750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size+++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "3017",
        "input_tokens": "358708",
        "output_tokens": "913754",
        "mean_ttft": "547.53",
        "median_ttft": "187.58",
        "p99_ttft": "7616.86",
        "hit_ratios": [
            "0.02173132183908046",
            "0.042177303835747255",
            "0.0422360248447205",
            "0.061897005387796016",
            "0.09166507359969413",
            "0.12860171154903038",
            "0.1376613218615565",
            "0.1414564283353531",
            "0.14308068459657702",
            "0.14769153352622974",
            "0.15336829966893578",
            "0.15563321684140455",
            "0.16933063874089044",
            "0.18654510984721756",
            "0.19344135802469134",
            "0.19410372283193458",
            "0.19025911192344905",
            "0.18793933412556144",
            "0.18554171738926864",
            "0.18420819999646398",
            "0.18189492166396537",
            "0.17808306811457444",
            "0.16986160322219188",
            "0.16579770594369128",
            "0.1572473082611159",
            "0.15262857370496757",
            "0.15112618689691498",
            "0.14955751088764455",
            "0.14932046459196208",
            "0.14932046459196208",
            "0.14932046459196208"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 6000 ",
        "size": 6000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "3001",
        "input_tokens": "358075",
        "output_tokens": "909629",
        "mean_ttft": "2546.49",
        "median_ttft": "198.51",
        "p99_ttft": "20668.16",
        "hit_ratios": [
            "0.01771414705168648",
            "0.04179870227855742",
            "0.04747207524985303",
            "0.04982249969396498",
            "0.06811377245508982",
            "0.07197747850566842",
            "0.0757527733755943",
            "0.07294026634248771",
            "0.0713485608532606",
            "0.07430184069752749",
            "0.07351512887560702",
            "0.07118746031215534",
            "0.06962413391378992",
            "0.07763706002404316",
            "0.08473876940533294",
            "0.08721374045801528",
            "0.08292682926829269",
            "0.0820913558366229",
            "0.07731842737094838",
            "0.07517838488641795",
            "0.07360633813546409",
            "0.07100085543199314",
            "0.06837541946945652",
            "0.06673618352450468",
            "0.06340025582559367",
            "0.061980590853037344",
            "0.0611913122642736",
            "0.06137184115523462",
            "0.06114433407662676",
            "0.06114433407662676",
            "0.06114433407662676"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 4000 ",
        "size": 4000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "3011",
        "input_tokens": "358288",
        "output_tokens": "912610",
        "mean_ttft": "542.48",
        "median_ttft": "185.78",
        "p99_ttft": "6943.94",
        "hit_ratios": [
            "0.0220351128627732",
            "0.04228028503562945",
            "0.042303535587463324",
            "0.062039695418799154",
            "0.09376496504166265",
            "0.1324313877077696",
            "0.14492659477718595",
            "0.1481274455002795",
            "0.14912888536923383",
            "0.15483213785492977",
            "0.1592256321752833",
            "0.16018039084683483",
            "0.1713226735281505",
            "0.18389639639639646",
            "0.19080222193515053",
            "0.19254926403605505",
            "0.1896808120864674",
            "0.18699695398704944",
            "0.1847924187725632",
            "0.18183906015369672",
            "0.1801810933171161",
            "0.17441382147264503",
            "0.16653846733933614",
            "0.16213889699445583",
            "0.15481333241322207",
            "0.15017747404111045",
            "0.14940418100570138",
            "0.1478642674043806",
            "0.1476337578811435",
            "0.1476337578811435",
            "0.1476337578811435"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 6000 ",
        "size": 6000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size+++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "3001",
        "input_tokens": "358075",
        "output_tokens": "909798",
        "mean_ttft": "2202.07",
        "median_ttft": "190.12",
        "p99_ttft": "18183.43",
        "hit_ratios": [
            "0.013121372697451426",
            "0.03652758673391411",
            "0.04240440410653177",
            "0.045651904230244386",
            "0.06448282335273138",
            "0.0722558870905883",
            "0.07668181527235485",
            "0.07562558952449647",
            "0.07437215165325317",
            "0.0771593251714418",
            "0.07557384951978344",
            "0.07289595758780648",
            "0.06994873661540328",
            "0.07779227629862018",
            "0.08489378644268065",
            "0.08856395625297192",
            "0.08404835776184869",
            "0.08322629846672552",
            "0.07872543336387605",
            "0.07616361071932297",
            "0.07463240879855491",
            "0.07207135715079271",
            "0.06898064125831815",
            "0.06744240576821614",
            "0.06424414162881467",
            "0.06251833675619445",
            "0.06165765579325864",
            "0.06182043719858737",
            "0.06169282609512591",
            "0.06169282609512591",
            "0.06169282609512591"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 4000 ",
        "size": 4000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size+++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "3016",
        "input_tokens": "358679",
        "output_tokens": "913965",
        "mean_ttft": "244.49",
        "median_ttft": "179.14",
        "p99_ttft": "1516.53",
        "hit_ratios": [
            "0.03665097511768661",
            "0.05566343042071197",
            "0.06899810964083175",
            "0.14713311442283405",
            "0.22078045987978248",
            "0.27118903606155725",
            "0.2945410535702911",
            "0.2991292195226833",
            "0.3001318639917113",
            "0.30382920221584236",
            "0.3075849731663685",
            "0.31908479309469406",
            "0.3323623652781824",
            "0.3490264070418778",
            "0.3536806508527739",
            "0.3597929446104028",
            "0.3563453020065729",
            "0.3558323289138877",
            "0.3509983272235469",
            "0.3548906750792878",
            "0.3580049043963265",
            "0.35232823677086644",
            "0.3421701249570102",
            "0.3379367720465891",
            "0.32654933361290583",
            "0.3134739228460035",
            "0.31028117359413215",
            "0.3078535935038178",
            "0.30631672812281596",
            "0.30631672812281596",
            "0.30631672812281596"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 7750 ",
        "size": 7750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "3018",
        "input_tokens": "358654",
        "output_tokens": "914159",
        "mean_ttft": "240.91",
        "median_ttft": "177.47",
        "p99_ttft": "1510.78",
        "hit_ratios": [
            "0.03663865546218487",
            "0.05566343042071197",
            "0.06894380607586967",
            "0.1592260022764639",
            "0.24968991508443855",
            "0.3166088631984586",
            "0.35123782854960867",
            "0.3558829855882986",
            "0.37070678399091683",
            "0.38127946675337343",
            "0.38368105172906547",
            "0.4044904569849789",
            "0.41708351616205935",
            "0.4313981706178831",
            "0.4367305900240326",
            "0.44046018908759543",
            "0.43671598420201785",
            "0.4342495929508669",
            "0.4313844181740494",
            "0.43643690706070026",
            "0.4385051579419492",
            "0.4348943763136805",
            "0.4249681492191191",
            "0.41982269012328577",
            "0.4056901725922917",
            "0.391158623954946",
            "0.3864730168812451",
            "0.38327888687235334",
            "0.3811528146909914",
            "0.3811528146909914",
            "0.3811528146909914"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "3020",
        "input_tokens": "358691",
        "output_tokens": "914271",
        "mean_ttft": "235.97",
        "median_ttft": "172.81",
        "p99_ttft": "1489.49",
        "hit_ratios": [
            "0.036632498739707614",
            "0.05566343042071197",
            "0.06894380607586967",
            "0.1592260022764639",
            "0.24968991508443852",
            "0.3166088631984586",
            "0.35123782854960867",
            "0.3547868061142398",
            "0.37004446967546595",
            "0.38071045358478306",
            "0.3818948270934553",
            "0.4025850296929087",
            "0.41509433962264153",
            "0.42963812368329823",
            "0.43511207023394977",
            "0.4389338193416107",
            "0.43534491579184326",
            "0.4330236567378605",
            "0.43108153909274166",
            "0.43534547896902026",
            "0.43746395848016917",
            "0.43371613841585355",
            "0.4243409742120344",
            "0.4192166971561616",
            "0.4047859040986503",
            "0.39060823121271865",
            "0.38529810877883586",
            "0.38199166616341557",
            "0.37985621872037056",
            "0.37985621872037056",
            "0.37985621872037056"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size+++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "3015",
        "input_tokens": "358686",
        "output_tokens": "912374",
        "mean_ttft": "245.28",
        "median_ttft": "182.49",
        "p99_ttft": "1493.68",
        "hit_ratios": [
            "0.03663865546218487",
            "0.05566343042071197",
            "0.06894380607586967",
            "0.14607309978500063",
            "0.220548989706443",
            "0.267510027769207",
            "0.2979276253247988",
            "0.29857335127860024",
            "0.29905437352245867",
            "0.3025281581719472",
            "0.30898293564197055",
            "0.31850042817723373",
            "0.3306086702671143",
            "0.3439021779846952",
            "0.35316067264023565",
            "0.35858147606868834",
            "0.3562081464643361",
            "0.35473296783345465",
            "0.34946198246989235",
            "0.3534155438325325",
            "0.3575139503559746",
            "0.35210712879086264",
            "0.3414151835611728",
            "0.33798878795888",
            "0.32568324696846157",
            "0.31285844589107004",
            "0.3092466801297351",
            "0.3069751632717474",
            "0.30555220131861777",
            "0.30555220131861777",
            "0.30555220131861777"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 7750 ",
        "size": 7750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size+++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "3023",
        "input_tokens": "358839",
        "output_tokens": "914342",
        "mean_ttft": "240.96",
        "median_ttft": "174.07",
        "p99_ttft": "1498.88",
        "hit_ratios": [
            "0.03585858585858586",
            "0.05165155440414508",
            "0.051443900899479256",
            "0.10214168039538715",
            "0.16407382355783168",
            "0.20518425983760152",
            "0.22815945716709077",
            "0.23859903112645472",
            "0.25168450257629804",
            "0.2556461198845305",
            "0.2540514057435743",
            "0.26469500924214423",
            "0.280205337539042",
            "0.29529345052452505",
            "0.30015020458900915",
            "0.30646632422831355",
            "0.3088597742897912",
            "0.30120724346076466",
            "0.29792061200382514",
            "0.29787534660285064",
            "0.29459093982420564",
            "0.2899814411877641",
            "0.2797163678147018",
            "0.27369961226132133",
            "0.2627555604705493",
            "0.2531865585168019",
            "0.25004177861192173",
            "0.24752638941879695",
            "0.24632311097059753",
            "0.24632311097059753",
            "0.24632311097059753"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 8000 ",
        "size": 8000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "3020",
        "input_tokens": "358758",
        "output_tokens": "914328",
        "mean_ttft": "235.35",
        "median_ttft": "173.81",
        "p99_ttft": "1491.78",
        "hit_ratios": [
            "0.03632694248234107",
            "0.05521373056994819",
            "0.06690863184472148",
            "0.14038657171922686",
            "0.2049743540114197",
            "0.2649941199529596",
            "0.30349273169769125",
            "0.32494992210104606",
            "0.3482594465932758",
            "0.34432453184319417",
            "0.3564905660377359",
            "0.3779089376053963",
            "0.39461148230635984",
            "0.40462036906606574",
            "0.4067933158346111",
            "0.40997443688805296",
            "0.40710471124948666",
            "0.40165757024459287",
            "0.40071028599346104",
            "0.4001134973133059",
            "0.3973053131090587",
            "0.39166947128868396",
            "0.37998574958688985",
            "0.3734469085034515",
            "0.3576282940360613",
            "0.34529124290054164",
            "0.340224545102594",
            "0.3366991332320616",
            "0.3350259606718039",
            "0.3350259606718039",
            "0.3350259606718039"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "3023",
        "input_tokens": "358870",
        "output_tokens": "914285",
        "mean_ttft": "240.95",
        "median_ttft": "179.16",
        "p99_ttft": "1506.91",
        "hit_ratios": [
            "0.035828427249789734",
            "0.05165155440414508",
            "0.0514520202020202",
            "0.10236918788800203",
            "0.16470361073566325",
            "0.21742902208201892",
            "0.2374435203981402",
            "0.24526420737786636",
            "0.25104623110629704",
            "0.25377924161810655",
            "0.25422904191616763",
            "0.2663385106595269",
            "0.2808328230251071",
            "0.2961984771430979",
            "0.3013991049843114",
            "0.3060394333843796",
            "0.3075832742735648",
            "0.3004133392190697",
            "0.2963494667760459",
            "0.2972778109942672",
            "0.2945233129247124",
            "0.2905634542820297",
            "0.27985444922262653",
            "0.2741578272525935",
            "0.2632651655993941",
            "0.2543338155991056",
            "0.25070834241464635",
            "0.24793241891155948",
            "0.24660775872919974",
            "0.24660775872919974",
            "0.24660775872919974"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 8000 ",
        "size": 8000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size+++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "3019",
        "input_tokens": "358748",
        "output_tokens": "914108",
        "mean_ttft": "237.99",
        "median_ttft": "171.99",
        "p99_ttft": "1470.16",
        "hit_ratios": [
            "0.03632083403396671",
            "0.05521373056994819",
            "0.06690863184472148",
            "0.14672400708322794",
            "0.21734104046242775",
            "0.2711345065996229",
            "0.30971712938711365",
            "0.3318552186685882",
            "0.3510899450117832",
            "0.34728439902018754",
            "0.35690992915776454",
            "0.3801321850590828",
            "0.397389145956547",
            "0.40514666889949486",
            "0.40740836145385245",
            "0.4103762281332376",
            "0.4086088316585607",
            "0.4023666265543523",
            "0.4028657673101291",
            "0.402625935951067",
            "0.4001443292048469",
            "0.39436396487780145",
            "0.3823163138231632",
            "0.3751559643675827",
            "0.359886221538208",
            "0.3474767040100515",
            "0.34242300214877747",
            "0.3389950639159601",
            "0.33735743598781454",
            "0.33735743598781454",
            "0.33735743598781454"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_sharegpt_20/sharegpt_epoch19_metric_0_5427.pt",
        "dataset_file": "/scratch/gpfs/dy5/.cache/huggingface/ShareGPT_V3_unfiltered_cleaned_split.json",
        "time_limit": 1200,
        "dataset_name": "sharegpt_0514",
        "scale": 1,
        "result_file": "sharegpt-size+++/client_logs/8001_lru.json"
    }
]