[
    {
        "num_requests": "4971",
        "input_tokens": "310408",
        "output_tokens": "860456",
        "mean_ttft": "171.86",
        "median_ttft": "152.75",
        "p99_ttft": "412.95",
        "hit_ratios": [
            "0.03929273084479371",
            "0.061121613106490225",
            "0.0675542406311637",
            "0.0743467059256533",
            "0.09339678762641285",
            "0.09642761214074672",
            "0.10338770388958596",
            "0.11985018726591762",
            "0.14767932489451477",
            "0.1717044500419815",
            "0.17888888888888885",
            "0.19009166302924488",
            "0.19825100903325005",
            "0.19596117178020456",
            "0.19405924992121024",
            "0.1931652579422909",
            "0.18706235411803937",
            "0.19129579542660438",
            "0.18759619221341847",
            "0.18378407383558704",
            "0.18417434696267632",
            "0.18214858869064476",
            "0.1792133597011646",
            "0.1818256884521696",
            "0.17928726127190395",
            "0.17814167433302672",
            "0.17553523176054878",
            "0.1745843621399177",
            "0.17344147582697203",
            "0.1772969333414948",
            "0.1743076834133087",
            "0.17356881851400735",
            "0.1777244231025744",
            "0.18031040779062696",
            "0.18112798264642085",
            "0.1826142826547367",
            "0.18228169339024108",
            "0.18052277886409093",
            "0.1784033485870437",
            "0.17922772980996382",
            "0.18420945643777686",
            "0.1821904799588493",
            "0.18370582617000947",
            "0.18200067539679554",
            "0.1796379758894873",
            "0.1787377924857466",
            "0.17838665399641002",
            "0.17601387910747715",
            "0.1747695243937767",
            "0.1747695243937767"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 3750 ",
        "size": 3750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "4992",
        "input_tokens": "312075",
        "output_tokens": "879273",
        "mean_ttft": "165.80",
        "median_ttft": "145.63",
        "p99_ttft": "398.25",
        "hit_ratios": [
            "0.0394088669950739",
            "0.06182281708094328",
            "0.06986027944111775",
            "0.08664931201190033",
            "0.10647307924984875",
            "0.10859606575047157",
            "0.13012167866898436",
            "0.1563084597796716",
            "0.21827904715605248",
            "0.23773584905660378",
            "0.25334972341733253",
            "0.270824247710423",
            "0.28093130652299403",
            "0.2738373603533385",
            "0.2780580075662043",
            "0.27409243329931476",
            "0.27361194427781105",
            "0.2814400688087485",
            "0.2868782405560937",
            "0.2870092254880927",
            "0.28527076547231267",
            "0.2847841472045293",
            "0.2959915518986227",
            "0.29824994852789777",
            "0.29805954906119875",
            "0.3005188974349537",
            "0.29791428867904934",
            "0.29466281056921245",
            "0.2962622451891068",
            "0.2994815492528209",
            "0.29922462744645884",
            "0.2974613686534215",
            "0.30077346304122465",
            "0.30254262940167476",
            "0.3023843398910856",
            "0.3043828285937536",
            "0.30525447420884977",
            "0.304164894926482",
            "0.30489410850370235",
            "0.3031798588117698",
            "0.30495262006965246",
            "0.30404765661985156",
            "0.30695010086400476",
            "0.30494546541162404",
            "0.30277864159364876",
            "0.30165148166118566",
            "0.29718440323680023",
            "0.29403831051319695",
            "0.2904530744336569",
            "0.2904530744336569"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 5750 ",
        "size": 5750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "5012",
        "input_tokens": "313518",
        "output_tokens": "867572",
        "mean_ttft": "167.88",
        "median_ttft": "148.47",
        "p99_ttft": "397.30",
        "hit_ratios": [
            "0.03685258964143426",
            "0.06254158349966733",
            "0.07003501750875436",
            "0.06599552572706935",
            "0.07299270072992702",
            "0.07348938486663038",
            "0.07035175879396985",
            "0.07708508845829823",
            "0.11167763157894736",
            "0.12082919210563678",
            "0.11615403850962738",
            "0.12762159750111557",
            "0.13116370808678499",
            "0.12835129598289832",
            "0.12371888726207904",
            "0.11866826995340447",
            "0.12741127205327107",
            "0.13545287908476075",
            "0.13622490902688106",
            "0.1352236155809566",
            "0.13482020457661076",
            "0.13171161470314718",
            "0.13181526619627965",
            "0.13093289689034368",
            "0.13418831434893058",
            "0.13398266738246792",
            "0.1368367605991368",
            "0.1378882415801992",
            "0.1378817111303306",
            "0.13801491534103635",
            "0.13592883689758115",
            "0.1346859172148803",
            "0.14018717698002509",
            "0.13769468743332616",
            "0.13604029285009603",
            "0.13661037394451142",
            "0.13526205654776385",
            "0.13446695323817892",
            "0.13373915829461977",
            "0.13347546099914281",
            "0.13575542186730608",
            "0.13499833361106484",
            "0.13349407273457906",
            "0.13623005463403087",
            "0.13587659516960443",
            "0.13613368953561072",
            "0.1337613598734317",
            "0.13157847549714",
            "0.13041096858546242",
            "0.13041096858546242",
            "0.13041096858546242"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 4000 ",
        "size": 4000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "4997",
        "input_tokens": "312551",
        "output_tokens": "866687",
        "mean_ttft": "166.01",
        "median_ttft": "146.95",
        "p99_ttft": "370.81",
        "hit_ratios": [
            "0.03944773175542406",
            "0.061626429479034316",
            "0.06986027944111775",
            "0.08351976137211035",
            "0.10567871242028544",
            "0.10800542740841247",
            "0.10819009100101111",
            "0.12703445360388924",
            "0.17027250206440958",
            "0.19296740994854203",
            "0.20409452799191205",
            "0.22305540011191943",
            "0.23173853120693055",
            "0.22639503985828172",
            "0.2243729333010727",
            "0.22049180327868853",
            "0.23155597981726442",
            "0.23966578715919087",
            "0.2426590538336052",
            "0.2382936725518149",
            "0.24244480400855997",
            "0.23982360922659435",
            "0.23998180577666595",
            "0.24064148375021274",
            "0.24494190298204277",
            "0.2485322150209684",
            "0.2500629836242577",
            "0.25529508533826856",
            "0.2554052261573153",
            "0.2591576260370135",
            "0.25967800289435605",
            "0.2575617373199931",
            "0.26545333481300637",
            "0.26159353042556016",
            "0.2573929561556629",
            "0.25665517155829015",
            "0.25609697666618764",
            "0.2546639167526016",
            "0.25309550218439464",
            "0.251092605074906",
            "0.2531259271817913",
            "0.25303810504634405",
            "0.248763433384319",
            "0.2493661504856263",
            "0.24712369540745266",
            "0.24810591853574382",
            "0.24347492323439104",
            "0.24001138506421893",
            "0.23740022805017108",
            "0.23740022805017108"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 6000 ",
        "size": 6000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "4998",
        "input_tokens": "312564",
        "output_tokens": "866489",
        "mean_ttft": "169.86",
        "median_ttft": "152.28",
        "p99_ttft": "384.85",
        "hit_ratios": [
            "0.0394088669950739",
            "0.06158730158730158",
            "0.06979062811565304",
            "0.09537892791127542",
            "0.11960132890365448",
            "0.12968917470525188",
            "0.15498247371056587",
            "0.2028654485049834",
            "0.2722411278561011",
            "0.30635918937805734",
            "0.3263002944062807",
            "0.342854028126022",
            "0.35084013442150747",
            "0.34259980947432234",
            "0.35170459018974887",
            "0.34581352833638024",
            "0.3489409884108166",
            "0.35510229157707196",
            "0.3623105844821693",
            "0.36330973830973834",
            "0.3610036644951139",
            "0.3629832687399563",
            "0.37326820603907623",
            "0.3808640448511829",
            "0.3854178923010549",
            "0.38929109551284397",
            "0.3921331629657767",
            "0.39591675966651335",
            "0.3979291346062505",
            "0.4001461943776078",
            "0.4007946791051221",
            "0.3969072164948452",
            "0.39485443824532623",
            "0.3966718168232819",
            "0.39805992564689646",
            "0.403124032669",
            "0.40231368391943567",
            "0.402788379506982",
            "0.4020408163265304",
            "0.4002708897687016",
            "0.4033519553072624",
            "0.4024240746599176",
            "0.4029887777692952",
            "0.4010608985773461",
            "0.3986916127613567",
            "0.3950044923629828",
            "0.3926888451258966",
            "0.38670886075949346",
            "0.38305525533639545",
            "0.38305525533639545"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 7750 ",
        "size": 7750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "4988",
        "input_tokens": "312003",
        "output_tokens": "865250",
        "mean_ttft": "163.78",
        "median_ttft": "143.01",
        "p99_ttft": "336.54",
        "hit_ratios": [
            "0.03929273084479371",
            "0.06182281708094328",
            "0.06979062811565304",
            "0.09537892791127542",
            "0.12008469449485783",
            "0.13344051446945338",
            "0.16786689843555996",
            "0.22926626480981088",
            "0.30238210986874087",
            "0.3323549965059399",
            "0.3581943081452405",
            "0.3756527415143604",
            "0.38290926548247733",
            "0.3786956521739131",
            "0.3956381387292339",
            "0.39758246559382515",
            "0.40705192294874365",
            "0.413589727836825",
            "0.41763063422417235",
            "0.4210469856254024",
            "0.4237581433224756",
            "0.43538570417551314",
            "0.44729682288924",
            "0.45345382520425853",
            "0.45905629269058656",
            "0.46702041417937956",
            "0.47386434349719986",
            "0.4762671221627304",
            "0.47758025160820117",
            "0.48021944529106986",
            "0.4796300564711308",
            "0.47916149496621174",
            "0.47814142060761267",
            "0.48135139232829643",
            "0.48280270436386",
            "0.4864575908766929",
            "0.4840441464482386",
            "0.4833874761958106",
            "0.4810923007070118",
            "0.4802944907763658",
            "0.48252159454965726",
            "0.4815114763165172",
            "0.48321137281805016",
            "0.48364643365017584",
            "0.48065964269354094",
            "0.47653312705751144",
            "0.4719740191345563",
            "0.46869495322627536",
            "0.465253736384362",
            "0.465253736384362"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "5025",
        "input_tokens": "313898",
        "output_tokens": "870474",
        "mean_ttft": "164.06",
        "median_ttft": "144.85",
        "p99_ttft": "338.73",
        "hit_ratios": [
            "0.03944773175542406",
            "0.06012439530062197",
            "0.06986027944111775",
            "0.09097688292319164",
            "0.11787878787878787",
            "0.1327001356852103",
            "0.1595878361397336",
            "0.2029169308814204",
            "0.26913539428004624",
            "0.3017818959372773",
            "0.32489028213166143",
            "0.342281131655157",
            "0.3471716674864732",
            "0.34847138286526835",
            "0.3577446532728451",
            "0.3621577258822651",
            "0.366848940533151",
            "0.3821511737680156",
            "0.3804449648711944",
            "0.37979998894966566",
            "0.379699642932157",
            "0.3761807381439283",
            "0.3833302903049114",
            "0.39057757257064685",
            "0.39953357063949924",
            "0.4057904235303153",
            "0.41032118368819925",
            "0.4153408311617062",
            "0.420535389298832",
            "0.42213740458015264",
            "0.424136370493287",
            "0.42515280821127904",
            "0.42626318711826766",
            "0.4263980805231102",
            "0.4276084783555886",
            "0.42847217052532327",
            "0.43119705164409133",
            "0.42778050318873084",
            "0.4266069499459849",
            "0.4252396097012182",
            "0.4259688289806235",
            "0.4266122750194744",
            "0.42570281124497994",
            "0.42629133536810593",
            "0.42518577646007955",
            "0.4238949786185132",
            "0.4184067778160774",
            "0.41713215018030125",
            "0.4129249211576324",
            "0.4125182761261575",
            "0.4125182761261575"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "5014",
        "input_tokens": "313558",
        "output_tokens": "868604",
        "mean_ttft": "169.30",
        "median_ttft": "149.48",
        "p99_ttft": "376.66",
        "hit_ratios": [
            "0.03933136676499509",
            "0.061626429479034316",
            "0.06986027944111775",
            "0.09218289085545722",
            "0.11770045385779121",
            "0.12328398384925975",
            "0.13338338338338337",
            "0.1582597730138714",
            "0.2220578566732413",
            "0.25637373593505197",
            "0.26601723491944546",
            "0.28389404269587576",
            "0.2968288359267284",
            "0.30269934292310424",
            "0.30051771558000323",
            "0.29656310971034067",
            "0.30844377647219556",
            "0.3213387015601409",
            "0.31911790443964766",
            "0.31663635862677025",
            "0.3180100755667506",
            "0.31617682897109717",
            "0.32441929448272716",
            "0.3299615877080666",
            "0.33746776372344345",
            "0.33998238829970523",
            "0.3407631825723148",
            "0.3461300946891725",
            "0.3484873587594023",
            "0.35131432212840524",
            "0.3519323671497585",
            "0.3486722075815934",
            "0.35389357920462117",
            "0.3521567379835096",
            "0.35316426304790893",
            "0.354960975488118",
            "0.35396081259766793",
            "0.3507561124982333",
            "0.34872994956150305",
            "0.3450127709738685",
            "0.34711728776044426",
            "0.34750657254642175",
            "0.3491317221510883",
            "0.3498959110727051",
            "0.3461464650341598",
            "0.3448600417898085",
            "0.34083542065713857",
            "0.3367431028305267",
            "0.3328510172751495",
            "0.3328510172751495",
            "0.3328510172751495"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 8000 ",
        "size": 8000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "5022",
        "input_tokens": "313879",
        "output_tokens": "868667",
        "mean_ttft": "167.52",
        "median_ttft": "147.31",
        "p99_ttft": "400.10",
        "hit_ratios": [
            "0.03929273084479371",
            "0.06158730158730158",
            "0.06979062811565304",
            "0.0875046347793845",
            "0.10647307924984875",
            "0.10798499464094319",
            "0.1311967951927892",
            "0.1563084597796716",
            "0.21827904715605248",
            "0.23776908023483367",
            "0.25438163416440385",
            "0.270824247710423",
            "0.2801728276524244",
            "0.2736641551918247",
            "0.27790037831021436",
            "0.27473967814752787",
            "0.2732786775978138",
            "0.2811328868956196",
            "0.28611316884152943",
            "0.28384466852606743",
            "0.2822679153094463",
            "0.28083939880896114",
            "0.29337206231845786",
            "0.296881462486558",
            "0.29627153307637855",
            "0.2995067726737338",
            "0.2966166193869785",
            "0.2966505604312527",
            "0.29707020102733217",
            "0.3002744739249772",
            "0.29998846863468637",
            "0.2981923554574308",
            "0.29881775239518577",
            "0.30295522916298007",
            "0.30282019129109206",
            "0.3047738812698715",
            "0.3056697361471514",
            "0.3043838809449102",
            "0.30527317558506734",
            "0.3035423707597948",
            "0.3052879251942151",
            "0.30511589305827264",
            "0.30807936417176524",
            "0.3059655423985634",
            "0.30401098901098905",
            "0.30286074127383955",
            "0.3002176125794111",
            "0.2959837367818645",
            "0.29302435007646166",
            "0.29302435007646166",
            "0.29302435007646166"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 5750 ",
        "size": 5750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "4974",
        "input_tokens": "310467",
        "output_tokens": "863002",
        "mean_ttft": "168.31",
        "median_ttft": "148.69",
        "p99_ttft": "395.25",
        "hit_ratios": [
            "0.0394088669950739",
            "0.06158730158730158",
            "0.06786427145708583",
            "0.0736607142857143",
            "0.09437386569872958",
            "0.09620048504446241",
            "0.10255773528681401",
            "0.12409062564955313",
            "0.15070491006319886",
            "0.17430807939614204",
            "0.1809429770427055",
            "0.19208546822195577",
            "0.20000000000000004",
            "0.19754048670650384",
            "0.19569672131147545",
            "0.19115173674588667",
            "0.18829567419849363",
            "0.19235731400135161",
            "0.1886147358823865",
            "0.18499249088178507",
            "0.1853114820846906",
            "0.1818697419415824",
            "0.18563822765873192",
            "0.1877145811789038",
            "0.18569794501636883",
            "0.1834619625137817",
            "0.18066528066528065",
            "0.17944411512876243",
            "0.17517737265756736",
            "0.1774070105617634",
            "0.17438195749602428",
            "0.17403345518998561",
            "0.1763352857792399",
            "0.18209008186956632",
            "0.18231500172320422",
            "0.18390257825135575",
            "0.18271814778234607",
            "0.18093184166778994",
            "0.17915797705943695",
            "0.17958791323609313",
            "0.18454002195211192",
            "0.1825301085688295",
            "0.18353201051148268",
            "0.18146963661186857",
            "0.17919201885654776",
            "0.17817451781745186",
            "0.17788385602218287",
            "0.1753791379959605",
            "0.17430397389264718",
            "0.17430397389264718"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 3750 ",
        "size": 3750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "5039",
        "input_tokens": "314280",
        "output_tokens": "872550",
        "mean_ttft": "167.64",
        "median_ttft": "147.64",
        "p99_ttft": "388.98",
        "hit_ratios": [
            "0.03944773175542406",
            "0.061626429479034316",
            "0.06993006993006994",
            "0.08558725453871804",
            "0.1060145808019441",
            "0.10855441256090957",
            "0.10828506673382018",
            "0.1278083933870284",
            "0.17013201320132013",
            "0.19240074000284615",
            "0.2056133316626989",
            "0.22497212931995536",
            "0.23250319913377296",
            "0.22512205947625383",
            "0.2220066294769181",
            "0.2190918627304061",
            "0.2320954003407155",
            "0.24041483343808925",
            "0.24129047368112888",
            "0.23716853189260712",
            "0.2403080469404862",
            "0.23689717261180596",
            "0.23623201686062498",
            "0.23836134634397968",
            "0.2411047728485246",
            "0.2465605611006204",
            "0.24806792206378578",
            "0.25459371875754133",
            "0.2549307036247336",
            "0.25958768166976126",
            "0.25943638950267883",
            "0.257156114961863",
            "0.261193611655926",
            "0.2606425276997296",
            "0.25768076962863345",
            "0.2572989968558167",
            "0.2566161884948473",
            "0.2553638941398865",
            "0.25400223168537794",
            "0.2526477359938603",
            "0.2541491786863242",
            "0.25417693215461373",
            "0.25166859837736305",
            "0.25257600439638084",
            "0.2505434887165971",
            "0.2507653929016896",
            "0.24611675500588934",
            "0.24226435342514763",
            "0.2390620330819667",
            "0.23889220610445722",
            "0.23889220610445722"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 6000 ",
        "size": 6000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "5031",
        "input_tokens": "314025",
        "output_tokens": "872669",
        "mean_ttft": "171.24",
        "median_ttft": "153.66",
        "p99_ttft": "380.22",
        "hit_ratios": [
            "0.03944773175542406",
            "0.06116015132408576",
            "0.06986027944111775",
            "0.06599552572706935",
            "0.0736270368135184",
            "0.07098177862387817",
            "0.06869455006337136",
            "0.07422120008362952",
            "0.10062997347480106",
            "0.11138118387189018",
            "0.10865445356917244",
            "0.11999104544436981",
            "0.12380577169309562",
            "0.12190560997328581",
            "0.11648209522269823",
            "0.1124118265045775",
            "0.12282497441146367",
            "0.13096134538152612",
            "0.13212722497811497",
            "0.13145565782946592",
            "0.13130571578395386",
            "0.1282750560046752",
            "0.12983273923772967",
            "0.1287865822351532",
            "0.13134499569830804",
            "0.13099900176610615",
            "0.13349242506417908",
            "0.1345248324454374",
            "0.13630640779272418",
            "0.13465889175668358",
            "0.13175167098211601",
            "0.13093450386970087",
            "0.13673663056827065",
            "0.1340795427482735",
            "0.13258901008437957",
            "0.13288036038726705",
            "0.13186308848039818",
            "0.1306922317778092",
            "0.13019133115705486",
            "0.13006642709354255",
            "0.1324334649178659",
            "0.1322157073251302",
            "0.13070841050765783",
            "0.13286384976525836",
            "0.13204329916658697",
            "0.13175079752298757",
            "0.13041642185663935",
            "0.12790365744870663",
            "0.12660560117919573",
            "0.12655008506831786",
            "0.12655008506831786"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 4000 ",
        "size": 4000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "5026",
        "input_tokens": "313932",
        "output_tokens": "870392",
        "mean_ttft": "168.81",
        "median_ttft": "147.36",
        "p99_ttft": "409.31",
        "hit_ratios": [
            "0.0394088669950739",
            "0.06158730158730158",
            "0.06779661016949154",
            "0.0736607142857143",
            "0.09512341962673089",
            "0.09751485683414371",
            "0.10464240903387705",
            "0.12649855312112446",
            "0.14849074975657256",
            "0.17242827151854445",
            "0.17931290163124072",
            "0.1906372762985596",
            "0.19873150105708245",
            "0.19639452244756456",
            "0.1947314456976102",
            "0.19360244826581172",
            "0.1874749899959984",
            "0.19149981574745117",
            "0.18797035347776514",
            "0.18631607190770058",
            "0.18656754417231022",
            "0.18436703483432457",
            "0.1877256317689531",
            "0.18978071990070333",
            "0.18844913053741444",
            "0.18685567010309279",
            "0.18387186051338825",
            "0.18250863060989644",
            "0.1778940691405011",
            "0.17988223449369983",
            "0.17687427912341408",
            "0.17575289148977283",
            "0.18010652463382157",
            "0.18239057324196528",
            "0.18272988717646194",
            "0.18418929181697363",
            "0.1831525353760063",
            "0.18214221664275476",
            "0.18010124610591907",
            "0.18086260115124722",
            "0.1857186327213714",
            "0.18379809877665573",
            "0.18518165529335526",
            "0.18344347305165024",
            "0.18152656083880195",
            "0.1807131280388979",
            "0.17972673948930493",
            "0.17653282367195103",
            "0.17461838477573804",
            "0.17461838477573804",
            "0.17461838477573804"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 3750 ",
        "size": 3750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "5027",
        "input_tokens": "313986",
        "output_tokens": "872922",
        "mean_ttft": "168.77",
        "median_ttft": "149.94",
        "p99_ttft": "380.91",
        "hit_ratios": [
            "0.0394088669950739",
            "0.06158730158730158",
            "0.06979062811565304",
            "0.09537892791127542",
            "0.11288380493678506",
            "0.1144238517324738",
            "0.1372647427854454",
            "0.1622960974602519",
            "0.21924699772801037",
            "0.23859501819199552",
            "0.2551587791918942",
            "0.27149716281099956",
            "0.27974245627522587",
            "0.27417391304347827",
            "0.2772612669398046",
            "0.271330308795551",
            "0.27210884353741494",
            "0.2801819522989918",
            "0.28563283922462934",
            "0.2831079630822065",
            "0.2815825653037323",
            "0.28136505239308973",
            "0.28892541424192614",
            "0.2976249381494309",
            "0.29665372092110937",
            "0.29931997794523063",
            "0.2972954302096646",
            "0.29369665134602757",
            "0.2941884402216943",
            "0.29653890683078415",
            "0.2964722822174226",
            "0.2947176885752095",
            "0.29548363015889945",
            "0.29983870154745706",
            "0.2996520801685696",
            "0.3020433319110606",
            "0.29941386047580737",
            "0.300766668901853",
            "0.3003004950602071",
            "0.30014357949934456",
            "0.30200513930760986",
            "0.30118273211117685",
            "0.3039476686696585",
            "0.3015051916037948",
            "0.29940876059380217",
            "0.297207744523848",
            "0.29529166447633565",
            "0.2921424919038691",
            "0.28827634801865587",
            "0.2882857190786936",
            "0.2882857190786936"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 5750 ",
        "size": 5750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "5023",
        "input_tokens": "313881",
        "output_tokens": "870368",
        "mean_ttft": "170.80",
        "median_ttft": "153.66",
        "p99_ttft": "392.80",
        "hit_ratios": [
            "0.0394088669950739",
            "0.06158730158730158",
            "0.06979062811565304",
            "0.09454949944382646",
            "0.11167971101745934",
            "0.1133494493687886",
            "0.13514186162269784",
            "0.16147016312203177",
            "0.21859785783836413",
            "0.2380352644836272",
            "0.2537808926595352",
            "0.2710606721955478",
            "0.2792619642513934",
            "0.2728375801698734",
            "0.2772300654625759",
            "0.2711107858919947",
            "0.2728909636545515",
            "0.28073518564052125",
            "0.2861783984041037",
            "0.28328414274215186",
            "0.2817353225724324",
            "0.281506655338431",
            "0.29314743138634763",
            "0.296436976177697",
            "0.29615067038886483",
            "0.29939282428702846",
            "0.29722895739521993",
            "0.29534531568898537",
            "0.2945517000095416",
            "0.29802601377199694",
            "0.2976902841615355",
            "0.2961404285951602",
            "0.29650525415118045",
            "0.30289441500203834",
            "0.3009653745751859",
            "0.3031167534412666",
            "0.3034164485466317",
            "0.30255327749208416",
            "0.3020261026298074",
            "0.30166489106139416",
            "0.303872002598932",
            "0.3034719753525299",
            "0.30632211309240004",
            "0.3038958606480614",
            "0.3014466214978941",
            "0.299629842593258",
            "0.29761737419173445",
            "0.29357813863554677",
            "0.290489167003095",
            "0.290489167003095",
            "0.290489167003095"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 5750 ",
        "size": 5750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size+++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "5022",
        "input_tokens": "313879",
        "output_tokens": "869699",
        "mean_ttft": "172.95",
        "median_ttft": "155.48",
        "p99_ttft": "408.40",
        "hit_ratios": [
            "0.0394088669950739",
            "0.061121613106490225",
            "0.06854043392504931",
            "0.0750828119249172",
            "0.09401963701279382",
            "0.09751485683414371",
            "0.1038895859473024",
            "0.12574850299401197",
            "0.1480038948393379",
            "0.1719843268961657",
            "0.17891491985203456",
            "0.19030990833697078",
            "0.19844320584278305",
            "0.19613451204714857",
            "0.194216829498897",
            "0.1899604858773599",
            "0.1871957319106369",
            "0.19141873616916646",
            "0.187720898415232",
            "0.18406224845720418",
            "0.18442894241050975",
            "0.18104874934985107",
            "0.18618473188341997",
            "0.1883740173769135",
            "0.18533548717544623",
            "0.18338540709428422",
            "0.18075003465964237",
            "0.17953954085833804",
            "0.17803729396041504",
            "0.18172075933864063",
            "0.1784846732215154",
            "0.1772428884026259",
            "0.18131354914467196",
            "0.18375992491311743",
            "0.18443178736099813",
            "0.18580405598400462",
            "0.18532791803203033",
            "0.18340002697720434",
            "0.18130938435506969",
            "0.1820291915854628",
            "0.18725990365657844",
            "0.18560838193140264",
            "0.18700847522333364",
            "0.1852233741399674",
            "0.18294582165301676",
            "0.18251793633053326",
            "0.181556043956044",
            "0.1782110484008894",
            "0.17608538289311992",
            "0.17608538289311992",
            "0.17608538289311992"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 3750 ",
        "size": 3750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size+++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "5030",
        "input_tokens": "314006",
        "output_tokens": "870307",
        "mean_ttft": "170.66",
        "median_ttft": "151.61",
        "p99_ttft": "416.10",
        "hit_ratios": [
            "0.03944773175542406",
            "0.061626429479034316",
            "0.06986027944111775",
            "0.06599552572706935",
            "0.07272727272727272",
            "0.07293354943273907",
            "0.07028112449799197",
            "0.07729775518847946",
            "0.10650298606502986",
            "0.11675490055801975",
            "0.11510971786833857",
            "0.12608792680205314",
            "0.12965884440938674",
            "0.12684444444444448",
            "0.12132739781464996",
            "0.11682558750656957",
            "0.12407610183410897",
            "0.13276854017828918",
            "0.13528755213534632",
            "0.1343093217989242",
            "0.13425583606211053",
            "0.12987076561582145",
            "0.13133672207720842",
            "0.13041605650788182",
            "0.13455081483907955",
            "0.1328292907583666",
            "0.13669870636698706",
            "0.1375497871171542",
            "0.13856001061254267",
            "0.1377925141873366",
            "0.13516373862296271",
            "0.13465937056660585",
            "0.14038623005877415",
            "0.13727983048602835",
            "0.13550414756041015",
            "0.13597627828167053",
            "0.13483200154038705",
            "0.1336626676076218",
            "0.13247194831689907",
            "0.13251434681097127",
            "0.1344473661888201",
            "0.13391824938067715",
            "0.13244056515414207",
            "0.13493335418051056",
            "0.13433150165616806",
            "0.1346964111052592",
            "0.13295412844036697",
            "0.13039525057495854",
            "0.1290096406660824",
            "0.1290096406660824",
            "0.1290096406660824"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 4000 ",
        "size": 4000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "5027",
        "input_tokens": "313986",
        "output_tokens": "871119",
        "mean_ttft": "169.09",
        "median_ttft": "149.65",
        "p99_ttft": "389.22",
        "hit_ratios": [
            "0.03944773175542406",
            "0.061626429479034316",
            "0.06986027944111775",
            "0.08483954260420509",
            "0.106184012066365",
            "0.10516355771830224",
            "0.10618347693867206",
            "0.12393073231796368",
            "0.16029265048220817",
            "0.18954435080702756",
            "0.20260782347041123",
            "0.22022145173917904",
            "0.22907228678353359",
            "0.22280623608017816",
            "0.2194884287454324",
            "0.2186841312857573",
            "0.23115405701754382",
            "0.24000506072874495",
            "0.24175566248092945",
            "0.23868175765645808",
            "0.24280509056344723",
            "0.24042751385007605",
            "0.24278438030560273",
            "0.24472755444607044",
            "0.2515723270440252",
            "0.25551527306386923",
            "0.257182240278584",
            "0.26309626313070444",
            "0.26393000898173724",
            "0.2683917604913",
            "0.2678500986193295",
            "0.26477761003367795",
            "0.2702589340640905",
            "0.2671700922651493",
            "0.2638763217083323",
            "0.26261238761238764",
            "0.2619887846852944",
            "0.2604766399244927",
            "0.2587710311226465",
            "0.2559940497024851",
            "0.2577077962201436",
            "0.2565581935912336",
            "0.2541700875067582",
            "0.25509883286831453",
            "0.2532135160098522",
            "0.25337212377677865",
            "0.2479297871949764",
            "0.24477339442972723",
            "0.24182442546447128",
            "0.24182442546447128",
            "0.24182442546447128"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 6000 ",
        "size": 6000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "5017",
        "input_tokens": "313757",
        "output_tokens": "869833",
        "mean_ttft": "171.31",
        "median_ttft": "153.05",
        "p99_ttft": "405.39",
        "hit_ratios": [
            "0.03933136676499509",
            "0.061626429479034316",
            "0.06993006993006994",
            "0.08524833209785025",
            "0.106184012066365",
            "0.10576142818501487",
            "0.10654490106544899",
            "0.11844863731656184",
            "0.15617253346554286",
            "0.18208955223880594",
            "0.19387373926036602",
            "0.2154220061864781",
            "0.2251513376293692",
            "0.21849405548216644",
            "0.21588447653429602",
            "0.2137535389658769",
            "0.2272388312656769",
            "0.2359121896303709",
            "0.2377196543524909",
            "0.2333588370313696",
            "0.23705438459536823",
            "0.2339653671277934",
            "0.23398947750362845",
            "0.2348768054375531",
            "0.2392109009558674",
            "0.24299207800121878",
            "0.24552851356679448",
            "0.2515789833054522",
            "0.2532516711119892",
            "0.2563972476773314",
            "0.25816807176502354",
            "0.25531731432513216",
            "0.2594537523269706",
            "0.25937623371496255",
            "0.25628886557309927",
            "0.25587202690006433",
            "0.25524994020569247",
            "0.25391227168683145",
            "0.2526918051989008",
            "0.25094941516026126",
            "0.2525303643724697",
            "0.25246997089328904",
            "0.25004942469653235",
            "0.2505093625691278",
            "0.24801643929448028",
            "0.24826259154087585",
            "0.24365020119075798",
            "0.24016585158409529",
            "0.23754909662215243",
            "0.23754909662215243",
            "0.23754909662215243"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 6000 ",
        "size": 6000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size+++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "5011",
        "input_tokens": "313161",
        "output_tokens": "869962",
        "mean_ttft": "174.64",
        "median_ttft": "158.58",
        "p99_ttft": "409.56",
        "hit_ratios": [
            "0.03944773175542406",
            "0.061626429479034316",
            "0.06986027944111775",
            "0.06599552572706935",
            "0.07261724659606655",
            "0.07283517669274346",
            "0.0709040263357812",
            "0.07689057879171947",
            "0.10876785121222185",
            "0.11871949468848693",
            "0.11682595573440643",
            "0.12788612418740192",
            "0.1325585975970061",
            "0.12940445548948257",
            "0.12354651162790697",
            "0.11899227712379096",
            "0.1273807085807905",
            "0.13570753230381344",
            "0.13634501726256656",
            "0.1352811466372657",
            "0.134325230511316",
            "0.13049631545556586",
            "0.1324029014782848",
            "0.13052595540719816",
            "0.1358110031309722",
            "0.13336642358061926",
            "0.13329010411037856",
            "0.13422772853280393",
            "0.13298294327647756",
            "0.13280702871331249",
            "0.1301768019035571",
            "0.13058399423215572",
            "0.13639264212190993",
            "0.13398104516333986",
            "0.13248237171238872",
            "0.132450001245299",
            "0.1325873586225191",
            "0.13081716637272192",
            "0.12979799124855465",
            "0.12993758456636548",
            "0.13222702611054593",
            "0.13163210619614954",
            "0.12989493791786053",
            "0.13200726860626424",
            "0.13091124305542295",
            "0.13081346344752665",
            "0.1293286477780218",
            "0.12699713232281853",
            "0.1259127931470299",
            "0.1259127931470299",
            "0.1259127931470299"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 4000 ",
        "size": 4000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size+++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "5027",
        "input_tokens": "313986",
        "output_tokens": "870160",
        "mean_ttft": "167.44",
        "median_ttft": "147.77",
        "p99_ttft": "368.77",
        "hit_ratios": [
            "0.0394088669950739",
            "0.06158730158730158",
            "0.06979062811565304",
            "0.08796466691203533",
            "0.11386288130474176",
            "0.12459807073954983",
            "0.15669232679413955",
            "0.19912700062357097",
            "0.26916221033868093",
            "0.3037037037037037",
            "0.3239695780176644",
            "0.34078273193066605",
            "0.34901584253480555",
            "0.3413007707629687",
            "0.3553751576292559",
            "0.3488848263254113",
            "0.3513963873891888",
            "0.35829139560574447",
            "0.36476554042504705",
            "0.3656404205106201",
            "0.36314128664495116",
            "0.36673743807501774",
            "0.37950296899054325",
            "0.38124845590051887",
            "0.3867787422915276",
            "0.39265474350482077",
            "0.39529737206085747",
            "0.3980911634029949",
            "0.4013758559472483",
            "0.4034643652221646",
            "0.406150919467343",
            "0.40139620871388754",
            "0.4018179885179672",
            "0.4018247529506912",
            "0.4030661130629191",
            "0.4085064996679001",
            "0.4089803039346219",
            "0.4070762749843148",
            "0.40742582821555223",
            "0.40375655212580086",
            "0.40674494534688",
            "0.40574360998717063",
            "0.40623511252548733",
            "0.4042330220633643",
            "0.40214123340910757",
            "0.399715581797235",
            "0.3959389972095962",
            "0.3909666626837137",
            "0.3861131644378738",
            "0.3861131644378738",
            "0.3861131644378738"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 7750 ",
        "size": 7750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "5030",
        "input_tokens": "314006",
        "output_tokens": "870042",
        "mean_ttft": "159.78",
        "median_ttft": "141.33",
        "p99_ttft": "332.38",
        "hit_ratios": [
            "0.036926147704590816",
            "0.060082872928176795",
            "0.07063572149344097",
            "0.08753709198813057",
            "0.11437216338880482",
            "0.1291801510248112",
            "0.16314874596473802",
            "0.2253169819164415",
            "0.2993031923513207",
            "0.3296995108315863",
            "0.3552550706822373",
            "0.3725062683963807",
            "0.38108497359577537",
            "0.37724084177708495",
            "0.394546027742749",
            "0.39619893686739965",
            "0.40578550956475373",
            "0.4124224365669349",
            "0.4165004843028887",
            "0.4200278910105128",
            "0.42279112377850164",
            "0.43448926633640017",
            "0.44531421786358233",
            "0.45303456259302144",
            "0.4576191225035383",
            "0.4658547354477887",
            "0.4731710690084359",
            "0.47616074655801266",
            "0.47801692712460775",
            "0.480652538496722",
            "0.48002766730070906",
            "0.47954200579390266",
            "0.48004533951919015",
            "0.4833295417203812",
            "0.48474042741558665",
            "0.487979855568225",
            "0.4874248474000642",
            "0.48510991104040146",
            "0.4829555286381726",
            "0.48177565235471453",
            "0.4839618815896187",
            "0.4832662404293945",
            "0.48537188510557344",
            "0.4865142899895255",
            "0.48274411544159324",
            "0.4796978960618593",
            "0.4731038098566933",
            "0.47109634551495005",
            "0.4668133418427327",
            "0.4661512920698269",
            "0.4661512920698269"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "5025",
        "input_tokens": "313898",
        "output_tokens": "870619",
        "mean_ttft": "165.87",
        "median_ttft": "145.70",
        "p99_ttft": "350.37",
        "hit_ratios": [
            "0.0394088669950739",
            "0.06182281708094328",
            "0.07107355864811132",
            "0.09454949944382646",
            "0.12008469449485783",
            "0.13344051446945338",
            "0.16786689843555996",
            "0.22926626480981088",
            "0.30238210986874087",
            "0.33240145373217783",
            "0.3581943081452405",
            "0.37557102458124864",
            "0.3829092654824773",
            "0.3788862908114662",
            "0.39555940477127793",
            "0.39931765389082463",
            "0.40698526961274417",
            "0.41352829145419917",
            "0.4175260668907755",
            "0.420970769643336",
            "0.42370724755700323",
            "0.43533852323661243",
            "0.4469570562922631",
            "0.4531488746644642",
            "0.45894861193148256",
            "0.4674730786251659",
            "0.4737206085753803",
            "0.47671629038088664",
            "0.4785696170428607",
            "0.4811991095117563",
            "0.4805441863146365",
            "0.4800364228360145",
            "0.48014056011074435",
            "0.48153473588618134",
            "0.4827357889057826",
            "0.4865717674970344",
            "0.4864072555710786",
            "0.4836140751180011",
            "0.48023625624716054",
            "0.47936223799512945",
            "0.4827278985947436",
            "0.48171309082300967",
            "0.4833742553150995",
            "0.4838354014052925",
            "0.4806766380462445",
            "0.47703205623775213",
            "0.47107900582442785",
            "0.4690703187624718",
            "0.46506630854456965",
            "0.46506630854456965",
            "0.46506630854456965"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size+++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "5022",
        "input_tokens": "313879",
        "output_tokens": "871277",
        "mean_ttft": "167.99",
        "median_ttft": "148.72",
        "p99_ttft": "377.95",
        "hit_ratios": [
            "0.03929273084479371",
            "0.06158730158730158",
            "0.06986027944111775",
            "0.09541420118343194",
            "0.11978221415607984",
            "0.12968917470525188",
            "0.16141047926496152",
            "0.20307628351694035",
            "0.2722411278561011",
            "0.30635918937805734",
            "0.3257184966838615",
            "0.34289140863497597",
            "0.3507441190590494",
            "0.34285961721659297",
            "0.3562421185372004",
            "0.349689213893967",
            "0.3521295740851829",
            "0.3583584198562388",
            "0.3653922853398666",
            "0.3662304226560824",
            "0.3637011400651465",
            "0.36650153338051417",
            "0.37959991206858634",
            "0.3815166851828991",
            "0.38641989862077086",
            "0.3931268186673541",
            "0.3956871824999134",
            "0.39929711620574115",
            "0.4017616678812458",
            "0.40383384634138897",
            "0.40649938059980983",
            "0.4016217110706602",
            "0.40203501501022815",
            "0.40090192799777047",
            "0.40217203930356826",
            "0.4083689966714216",
            "0.408465899960976",
            "0.40649420641336564",
            "0.4068648695501429",
            "0.4035223009587327",
            "0.40674180119809106",
            "0.4055251240878798",
            "0.405394571068606",
            "0.4031045537204026",
            "0.40020153902528394",
            "0.39676375404530745",
            "0.39440212515173373",
            "0.388861364995302",
            "0.3846309301268125",
            "0.3846309301268125",
            "0.3846309301268125"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 7750 ",
        "size": 7750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size+++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "5021",
        "input_tokens": "313871",
        "output_tokens": "870898",
        "mean_ttft": "164.86",
        "median_ttft": "145.71",
        "p99_ttft": "355.55",
        "hit_ratios": [
            "0.03696303696303697",
            "0.06012439530062197",
            "0.06986027944111775",
            "0.08389261744966442",
            "0.10749086479902557",
            "0.11480774475047723",
            "0.1248426881449786",
            "0.1522756273925989",
            "0.2098436980379115",
            "0.245724960482828",
            "0.25575833857772184",
            "0.27614968440036064",
            "0.29146426092990974",
            "0.29540989462404",
            "0.2933452944054803",
            "0.28719461462824286",
            "0.3012578184067633",
            "0.3153358681875792",
            "0.3125773195876288",
            "0.30892996325576216",
            "0.3100475938656795",
            "0.30714565771417374",
            "0.3165457717381324",
            "0.3210009940787483",
            "0.33088931910862135",
            "0.3312957016288157",
            "0.3341728719521098",
            "0.3397566977437355",
            "0.34051608579088477",
            "0.34286910859830555",
            "0.3440817571690055",
            "0.3406741047958409",
            "0.34632070982730156",
            "0.345714895205589",
            "0.34608704668584905",
            "0.3478914530557017",
            "0.3472524285921415",
            "0.3447615444636228",
            "0.3421076642335765",
            "0.3389626319709115",
            "0.3413629768712126",
            "0.3426267567679614",
            "0.3440113650006001",
            "0.34500982318271106",
            "0.34253771551724127",
            "0.3411629093520285",
            "0.3361395511276951",
            "0.33287384306915624",
            "0.3291239704403957",
            "0.3291239704403957",
            "0.3291239704403957"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 8000 ",
        "size": 8000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "5023",
        "input_tokens": "313881",
        "output_tokens": "869796",
        "mean_ttft": "159.69",
        "median_ttft": "140.23",
        "p99_ttft": "355.35",
        "hit_ratios": [
            "0.03696303696303697",
            "0.06163934426229509",
            "0.06986027944111775",
            "0.08706928492034087",
            "0.10867579908675798",
            "0.12388181078883165",
            "0.15204236006051436",
            "0.20168421052631577",
            "0.2675358970127083",
            "0.3028969042885543",
            "0.3234117058529264",
            "0.343518211004096",
            "0.3483498188228381",
            "0.3494690265486726",
            "0.3580666020045264",
            "0.36383911976804706",
            "0.3683744379343235",
            "0.3826524198617222",
            "0.3804462095549586",
            "0.3778302923719499",
            "0.37875772493977167",
            "0.37638556570145026",
            "0.3843619892940477",
            "0.39276053072265876",
            "0.4017055471280391",
            "0.40740597878495666",
            "0.4114780331684609",
            "0.41677286034096783",
            "0.42007261583558175",
            "0.4221738852280724",
            "0.4247908330301928",
            "0.42642503546304605",
            "0.4282700421940928",
            "0.4275946146506943",
            "0.4290207806940648",
            "0.4291419158388658",
            "0.43171382551626314",
            "0.42707183617875677",
            "0.42539696921648124",
            "0.4241514360313316",
            "0.42533706436021373",
            "0.426465737610291",
            "0.4254549070299294",
            "0.42603411555520815",
            "0.42415043909889266",
            "0.4230978617957911",
            "0.4174928920317853",
            "0.4163990846032393",
            "0.412339934224337",
            "0.4120464238271691",
            "0.4120464238271691"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "5030",
        "input_tokens": "314006",
        "output_tokens": "873326",
        "mean_ttft": "167.28",
        "median_ttft": "146.91",
        "p99_ttft": "371.72",
        "hit_ratios": [
            "0.03944773175542406",
            "0.061626429479034316",
            "0.06986027944111775",
            "0.08475836431226766",
            "0.11212121212121211",
            "0.12675296655879179",
            "0.15457967377666246",
            "0.19831401475237093",
            "0.2618061309030654",
            "0.2980481550078358",
            "0.32034089484897854",
            "0.34083850931677007",
            "0.3455810307662159",
            "0.345904694294081",
            "0.3572120820545953",
            "0.3586305064429127",
            "0.3675277758843977",
            "0.3812723732964893",
            "0.379489575424867",
            "0.377610049033111",
            "0.3776974649067672",
            "0.37497566673155525",
            "0.3825380895903658",
            "0.3893172277906279",
            "0.4005973569002905",
            "0.40681147760793773",
            "0.41181782063784445",
            "0.4161004735433395",
            "0.420921915358633",
            "0.42259800643291606",
            "0.42380348844227167",
            "0.4228847098246526",
            "0.4217943351472024",
            "0.42382776383568876",
            "0.42570394517313065",
            "0.42713205294059103",
            "0.42717605735456854",
            "0.4236937888928025",
            "0.4209893078477218",
            "0.42079724966273546",
            "0.4217434636018574",
            "0.42251893431289583",
            "0.4217198352206013",
            "0.42122016951138525",
            "0.4188599846977811",
            "0.417683957480374",
            "0.41382404101437326",
            "0.4118589173221339",
            "0.4072990398766556",
            "0.40703456003361455",
            "0.40703456003361455"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size+++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "5029",
        "input_tokens": "313999",
        "output_tokens": "872182",
        "mean_ttft": "169.76",
        "median_ttft": "150.49",
        "p99_ttft": "364.98",
        "hit_ratios": [
            "0.03944773175542406",
            "0.06254158349966733",
            "0.06986027944111775",
            "0.08517699115044249",
            "0.11147540983606556",
            "0.11942718184274519",
            "0.12986686762120067",
            "0.15663661144894106",
            "0.21193585716647376",
            "0.24806866952789697",
            "0.25678733031674206",
            "0.27736081550352865",
            "0.2918429597559775",
            "0.29654006937650096",
            "0.29632041680234456",
            "0.2919086041776639",
            "0.30550414696003836",
            "0.31795455983798493",
            "0.3169629760018776",
            "0.3131956365247245",
            "0.31480700274203754",
            "0.3104022735067863",
            "0.31726390358342155",
            "0.3226489265195042",
            "0.3324544780423499",
            "0.336327578161456",
            "0.337928519328957",
            "0.3429988553987029",
            "0.3462554771381745",
            "0.34915276036140336",
            "0.3486246915836609",
            "0.3448668203168307",
            "0.3463512294157457",
            "0.35196759569730957",
            "0.3522948648016833",
            "0.35369904378460015",
            "0.35231359968892795",
            "0.3490003090602194",
            "0.3470576098668075",
            "0.3436709000066034",
            "0.34554457567897817",
            "0.3470152360336361",
            "0.34878671518465676",
            "0.3494445103388291",
            "0.3458679999227846",
            "0.34466010207372855",
            "0.3400170017740983",
            "0.33614064071254146",
            "0.3317912134482273",
            "0.3317912134482273",
            "0.3317912134482273"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 8000 ",
        "size": 8000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys_0514",
        "scale": 1,
        "result_file": "lmsys-size+++/client_logs/8000_lru.json"
    }
]