[
    {
        "num_requests": "4909",
        "input_tokens": "304274",
        "output_tokens": "866848",
        "mean_ttft": "170.44",
        "median_ttft": "150.80",
        "p99_ttft": "370.24",
        "hit_ratios": [
            "0.03929273084479371",
            "0.06158730158730158",
            "0.07051282051282051",
            "0.09492273730684327",
            "0.11990335246149199",
            "0.13344051446945338",
            "0.16786689843555996",
            "0.21430056121388488",
            "0.2689506785832506",
            "0.30514496873223423",
            "0.32777915941308133",
            "0.34697450486924175",
            "0.35492957746478876",
            "0.35679887925750814",
            "0.364875637755102",
            "0.3703839122486288",
            "0.37528573349468863",
            "0.3897773403862714",
            "0.38836165255441263",
            "0.38954017450885925",
            "0.3863868464052288",
            "0.3835328912846443",
            "0.39364689364689354",
            "0.4026787554090253",
            "0.4107400898262058",
            "0.4172037498169035",
            "0.42115747896273403",
            "0.42419525765001986",
            "0.428361310951239",
            "0.42878464818763323",
            "0.42760233242884355",
            "0.4275362318840579",
            "0.4298885592880622",
            "0.4285786892328022",
            "0.42966872320919736",
            "0.4298373420593785",
            "0.43105197620255487",
            "0.4290987665436211",
            "0.42591870341480315",
            "0.42623917760316826",
            "0.4293150964580994",
            "0.42821890547263675",
            "0.4270650263620386",
            "0.4253480102889998",
            "0.42334053834358654",
            "0.42284598133545526",
            "0.41751994915613294",
            "0.41472379933387393",
            "0.411398451093446",
            "0.411398451093446"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m/lmsys-chat-1m_epoch4_metric_0_6818.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys",
        "scale": 1,
        "result_file": "lmsys-reqrate+/client_logs/8000_lru.json"
    },
    {
        "num_requests": "6615",
        "input_tokens": "398563",
        "output_tokens": "1164458",
        "mean_ttft": "185.96",
        "median_ttft": "186.02",
        "p99_ttft": "364.80",
        "hit_ratios": [
            "0.028028028028028028",
            "0.060072815533980584",
            "0.08104517271922054",
            "0.11877789220734636",
            "0.13411896745230079",
            "0.1704878048780488",
            "0.20608251807741385",
            "0.22610809799887788",
            "0.22627857260319023",
            "0.2281340003031681",
            "0.24909066415196013",
            "0.25384707145413343",
            "0.2713983050847458",
            "0.27628291370363245",
            "0.3012490173814306",
            "0.3145417063114494",
            "0.32379723237972324",
            "0.33459319673761684",
            "0.33931203931203924",
            "0.3464325693748895",
            "0.3523255813953488",
            "0.3574950951800201",
            "0.36641068112232084",
            "0.3719143213908365",
            "0.3780465372942149",
            "0.38704478132078746",
            "0.38961414525324284",
            "0.393758168640342",
            "0.3992302177276328",
            "0.40399709302325565",
            "0.4088342283041745",
            "0.4036353916065222",
            "0.3997257232416899",
            "0.40234781785477597",
            "0.40771049281687566",
            "0.4060647379653782",
            "0.4060456579098312",
            "0.41346548750102663",
            "0.41460147354320154",
            "0.4199025965570226",
            "0.42380976320949165",
            "0.42304032789284923",
            "0.4265386150703266",
            "0.42600082731994304",
            "0.42905202183357477",
            "0.43223022206800843",
            "0.43335736397947516",
            "0.43664207098396485",
            "0.4387444885139626",
            "0.43855218855218864",
            "0.44046342397548843",
            "0.44173184357541906",
            "0.44364800698600987",
            "0.44292997238547055",
            "0.44828299188448756",
            "0.4491792238403906",
            "0.4480364219973143",
            "0.44768911283182283",
            "0.44840495566236777",
            "0.4485781916715982",
            "0.4475981190644498",
            "0.44763031737362713",
            "0.4478868597282358",
            "0.4479886585149745",
            "0.4471907823911084",
            "0.44579196183524217",
            "0.4447645254679395",
            "0.4447645254679395"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.02,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m/lmsys-chat-1m_epoch4_metric_0_6818.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys",
        "scale": 2,
        "result_file": "lmsys-reqrate+/client_logs/8001_lru.json"
    },
    {
        "num_requests": "8306",
        "input_tokens": "484485",
        "output_tokens": "1428493",
        "mean_ttft": "203.89",
        "median_ttft": "205.34",
        "p99_ttft": "390.07",
        "hit_ratios": [
            "0.03887269193391643",
            "0.0803727431566686",
            "0.09637526652452026",
            "0.15533088235294118",
            "0.16573886639676114",
            "0.19357014388489208",
            "0.21920792079207918",
            "0.23236587510993836",
            "0.2391233766233766",
            "0.2323682256867112",
            "0.23554264589384735",
            "0.2502937720329025",
            "0.2573784722222222",
            "0.25789897363654657",
            "0.2672630696114062",
            "0.2699831365935919",
            "0.2810844499844188",
            "0.28405776481468303",
            "0.28356387306753456",
            "0.2926360315323976",
            "0.29675613170227005",
            "0.30478328440683816",
            "0.3072981958903363",
            "0.31112856768787645",
            "0.31718575631530893",
            "0.3220028004442084",
            "0.32273345527883307",
            "0.3298656655660591",
            "0.33458225667527997",
            "0.33251732293265845",
            "0.33226401475659645",
            "0.3351391378907163",
            "0.34207457014936604",
            "0.34496067579376644",
            "0.342416434294589",
            "0.3441445140100585",
            "0.3464739961377106",
            "0.34971209213051824",
            "0.35200247409927327",
            "0.35203186777252593",
            "0.3541055079203604",
            "0.3582001016891701",
            "0.3631321548591569",
            "0.36601875263379685",
            "0.3667270844122217",
            "0.37208890238963155",
            "0.37216431637032504",
            "0.3753176129752322",
            "0.37623462541930686",
            "0.3805142453711085",
            "0.38343680709534367",
            "0.3860180398433951",
            "0.38854335771963483",
            "0.3896889221370239",
            "0.3917750239098142",
            "0.39377430370501965",
            "0.3932412269653342",
            "0.39410993022415725",
            "0.39487457475045795",
            "0.3958818958818959",
            "0.3982176702143169",
            "0.40040241448692154",
            "0.40039914519347947",
            "0.4008725578808316",
            "0.39954099371435425",
            "0.39919001012487343",
            "0.3977619363395225",
            "0.3971199476354116",
            "0.39546375050627786",
            "0.39657834009707965",
            "0.39712205379280047",
            "0.39733337458043966",
            "0.3979465554384196",
            "0.3975981579858237",
            "0.39878805793674255",
            "0.40063210392020415",
            "0.4015917924096936",
            "0.40028625278104507",
            "0.4003771476463193",
            "0.40282797191265995",
            "0.4034281388558452",
            "0.40248551897582713",
            "0.40193510169156854",
            "0.40102767109281817",
            "0.40102767109281817"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8002  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.03,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m/lmsys-chat-1m_epoch4_metric_0_6818.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys",
        "scale": 3,
        "result_file": "lmsys-reqrate+/client_logs/8002_lru.json"
    },
    {
        "num_requests": "9571",
        "input_tokens": "557844",
        "output_tokens": "1676559",
        "mean_ttft": "219.37",
        "median_ttft": "219.10",
        "p99_ttft": "448.19",
        "hit_ratios": [
            "0.04407443682664055",
            "0.0975473801560758",
            "0.11933656957928802",
            "0.16980568011958147",
            "0.1813627254509018",
            "0.20166631061738943",
            "0.21200311769290728",
            "0.22060627299807253",
            "0.2173230817511376",
            "0.2267806267806268",
            "0.2338129496402878",
            "0.23431156478366777",
            "0.23529411764705885",
            "0.23994238090338516",
            "0.24366509297620198",
            "0.24263176144244109",
            "0.24177763516765605",
            "0.2425415622864951",
            "0.24684799546678",
            "0.26146055437100213",
            "0.26494023904382474",
            "0.2718376223269301",
            "0.28197823485841267",
            "0.284020390070922",
            "0.2922682569575225",
            "0.29498941425546926",
            "0.3002482597478459",
            "0.3001751810993797",
            "0.30217331999636254",
            "0.30189673340358264",
            "0.30317223759846706",
            "0.30484873601326146",
            "0.3044247787610619",
            "0.30416764406912183",
            "0.30807199851549444",
            "0.3097072419106317",
            "0.3121220644072563",
            "0.31539718194813143",
            "0.3190620471611118",
            "0.32128176080271886",
            "0.3241899968543567",
            "0.3229080428050164",
            "0.32670345560244335",
            "0.32770620039111925",
            "0.3306010161974005",
            "0.33106638398634314",
            "0.3289907519099316",
            "0.3307950845499421",
            "0.33410678769952556",
            "0.3351073132948553",
            "0.33629133934632904",
            "0.3418269572006528",
            "0.3449035940509059",
            "0.3448470737165719",
            "0.3464743660970242",
            "0.3470683186458423",
            "0.34792611864880546",
            "0.34782331434401825",
            "0.349262868565717",
            "0.3508108991380365",
            "0.3521483746379142",
            "0.35080006337135594",
            "0.3500868580797531",
            "0.34978524165151087",
            "0.347574180312298",
            "0.347465576107755",
            "0.3477551927958641",
            "0.34870490963635015",
            "0.34805330076862273",
            "0.3480659088906509",
            "0.34843271840799434",
            "0.3471022379429968",
            "0.3485202752354864",
            "0.34844990610483284",
            "0.3479325441868004",
            "0.3482623631860666",
            "0.348719803724207",
            "0.3485250120138272",
            "0.34986550100874214",
            "0.349372227652056",
            "0.3502370858383677",
            "0.3504914112397559",
            "0.35032771804749013",
            "0.35060192845324334",
            "0.3511654188444693",
            "0.35213389121338884",
            "0.35279808677827096",
            "0.35203079159152667",
            "0.35404630009122495",
            "0.3561574170665551",
            "0.35622803743129633",
            "0.35719363274010485",
            "0.3568213642728543",
            "0.35626826471349804",
            "0.35393539720339473",
            "0.3529816846276516",
            "0.352842486421243",
            "0.352842486421243"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8003  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.04,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m/lmsys-chat-1m_epoch4_metric_0_6818.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys",
        "scale": 4,
        "result_file": "lmsys-reqrate+/client_logs/8003_lru.json"
    },
    {
        "num_requests": "4020",
        "input_tokens": "272121",
        "output_tokens": "715227",
        "mean_ttft": "171.40",
        "median_ttft": "150.42",
        "p99_ttft": "397.23",
        "hit_ratios": [
            "0.01331967213114754",
            "0.028827674567584886",
            "0.03799392097264438",
            "0.06050096339113681",
            "0.06361829025844931",
            "0.08508088675853806",
            "0.12233169129720854",
            "0.23162675474814204",
            "0.2505982905982906",
            "0.26184052757793763",
            "0.2794639337800552",
            "0.3014413800930655",
            "0.3212450592885376",
            "0.34838257210484785",
            "0.37715415019762843",
            "0.38272043163424674",
            "0.39013538422424204",
            "0.3937437643054169",
            "0.39828126689006593",
            "0.39796498114766804",
            "0.3957650856952951",
            "0.39890857040615496",
            "0.3983856653847779",
            "0.40723426171704774",
            "0.4151794172255694",
            "0.419084882078035",
            "0.4137883488452258",
            "0.40808726601634593",
            "0.4081288392374041",
            "0.4025986078886311",
            "0.3965366661647343",
            "0.3870231019236964",
            "0.3852694473170172",
            "0.3785380329796467",
            "0.3707414282594454",
            "0.36472748562912505",
            "0.35829499043581664",
            "0.35124465677646466",
            "0.3452893937910097",
            "0.34500952660120177",
            "0.34500952660120177"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.005,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m/lmsys-chat-1m_epoch4_metric_0_6818.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys",
        "scale": 0.5,
        "result_file": "lmsys-reqrate+/client_logs/8001_lru.json"
    },
    {
        "num_requests": "3900",
        "input_tokens": "278653",
        "output_tokens": "703398",
        "mean_ttft": "174.94",
        "median_ttft": "160.54",
        "p99_ttft": "418.29",
        "hit_ratios": [
            "0.01331967213114754",
            "0.054334554334554336",
            "0.05427782888684452",
            "0.055404881828748545",
            "0.06134371957156767",
            "0.0637904468412943",
            "0.12573885008060184",
            "0.19750161533491278",
            "0.23260754115772703",
            "0.27248079530049707",
            "0.28521806252412196",
            "0.3108790838666218",
            "0.3216380081502833",
            "0.33679795769511306",
            "0.3459387261040154",
            "0.3565527173501099",
            "0.3485807782599416",
            "0.3497802636835796",
            "0.342774637503072",
            "0.3420134852359916",
            "0.33955511507543223",
            "0.3381662668196516",
            "0.34042765289338583",
            "0.34205221956593074",
            "0.3398062606511795",
            "0.3347529442440572",
            "0.3281079721686646",
            "0.3262204978984804",
            "0.32416549130230365",
            "0.3183230990827079",
            "0.31223005648049024",
            "0.3016114751195325",
            "0.2958706125258087",
            "0.2896360785883452",
            "0.28334036545389635",
            "0.27775856105153934",
            "0.2718511946645456",
            "0.2683212996389892",
            "0.2683212996389892",
            "0.2683212996389892"
        ],
        "args": "--num-gpu-blocks-override 10000  --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 ",
        "size": 10000,
        "num_prompts": 50000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.0025,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m/lmsys-chat-1m_epoch4_metric_0_6818.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys",
        "scale": 0.25,
        "result_file": "lmsys-reqrate+/client_logs/8000_lru.json"
    },
    {
        "num_requests": "4114",
        "input_tokens": "278111",
        "output_tokens": "720394",
        "mean_ttft": "176.87",
        "median_ttft": "157.85",
        "p99_ttft": "391.55",
        "hit_ratios": [
            "0.016243654822335026",
            "0.030973451327433628",
            "0.03784056508577195",
            "0.0548102721349176",
            "0.06309562931317779",
            "0.09467803587180242",
            "0.13062213843253434",
            "0.24840107282855373",
            "0.2880297146716191",
            "0.30979228486646876",
            "0.3319294551197683",
            "0.35455680399500616",
            "0.3736145169200587",
            "0.3913421418636995",
            "0.41938526845373786",
            "0.42758571631811065",
            "0.443503003477711",
            "0.4469696969696969",
            "0.4500748342954886",
            "0.4528437355761834",
            "0.4463252522354516",
            "0.45681144020896974",
            "0.45055037391815805",
            "0.45627075755179497",
            "0.4614808434141043",
            "0.4647092647164522",
            "0.4673016091321689",
            "0.4656797208725991",
            "0.4590907648869008",
            "0.45610311307985724",
            "0.44908319894881454",
            "0.4420884699057288",
            "0.4385730528709494",
            "0.43641906873614195",
            "0.43051049102314515",
            "0.4269920844327177",
            "0.4219558002521289",
            "0.4152643930693563",
            "0.406547604623549",
            "0.40603175370339045",
            "0.40603175370339045",
            "0.40603175370339045"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.005,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys",
        "scale": 0.5,
        "result_file": "lmsys-reqrate++/client_logs/8001_ml.json"
    },
    {
        "num_requests": "4002",
        "input_tokens": "288354",
        "output_tokens": "706994",
        "mean_ttft": "187.79",
        "median_ttft": "173.09",
        "p99_ttft": "429.37",
        "hit_ratios": [
            "0.01331967213114754",
            "0.05575539568345323",
            "0.053730017761989345",
            "0.05491990846681922",
            "0.06109324758842444",
            "0.06377079482439926",
            "0.12547017732401933",
            "0.20800172080017207",
            "0.24246231155778894",
            "0.2963019327347436",
            "0.3121118012422361",
            "0.32994235334011535",
            "0.35406268716310646",
            "0.3663575429253513",
            "0.3735868017753957",
            "0.37502851494182954",
            "0.3712737127371274",
            "0.37521803300684287",
            "0.37745764807716087",
            "0.37484716157205233",
            "0.3770917324791517",
            "0.3730300483294809",
            "0.37881965248651883",
            "0.37698748706369367",
            "0.36998474104658474",
            "0.36342683191998265",
            "0.3571158293041834",
            "0.34702099951163934",
            "0.3471457776379935",
            "0.34606878670022123",
            "0.3365740056188083",
            "0.32692990554648116",
            "0.3204503851068975",
            "0.31611357054888006",
            "0.31052750589527417",
            "0.30709653044518614",
            "0.2998016175797346",
            "0.2955610283517541",
            "0.29547228727556607",
            "0.29547228727556607",
            "0.29547228727556607"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.0025,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys",
        "scale": 0.25,
        "result_file": "lmsys-reqrate++/client_logs/8000_ml.json"
    },
    {
        "num_requests": "5018",
        "input_tokens": "313802",
        "output_tokens": "871060",
        "mean_ttft": "168.71",
        "median_ttft": "150.83",
        "p99_ttft": "345.07",
        "hit_ratios": [
            "0.03929273084479371",
            "0.06158730158730158",
            "0.07107355864811132",
            "0.09492273730684327",
            "0.11990335246149199",
            "0.13344051446945338",
            "0.16786689843555996",
            "0.22926626480981088",
            "0.30238210986874087",
            "0.3323549965059399",
            "0.3581943081452405",
            "0.3748371689101173",
            "0.38290926548247733",
            "0.37775464167968076",
            "0.3955594047712778",
            "0.3975096482924343",
            "0.40695814449480144",
            "0.41352829145419917",
            "0.4175022789425707",
            "0.4209933490667239",
            "0.42370724755700323",
            "0.43571597074781787",
            "0.44730833406516196",
            "0.45219468006258745",
            "0.4585600504692059",
            "0.4669025504938817",
            "0.4739972337482711",
            "0.47661645727816876",
            "0.4784428100431144",
            "0.48107712482083503",
            "0.4804288926039085",
            "0.4799260506056676",
            "0.4789070629986392",
            "0.4815562395922693",
            "0.4828457838421518",
            "0.4874594415366033",
            "0.4861104744441898",
            "0.48356639445128097",
            "0.4812679492993026",
            "0.4804644496603868",
            "0.4826845963789543",
            "0.48167074421908307",
            "0.4834234165651645",
            "0.48379560406698574",
            "0.4808090052164364",
            "0.47699278945570284",
            "0.47221004261886806",
            "0.4682435317223124",
            "0.46530427037292243",
            "0.46530427037292243",
            "0.46530427037292243"
        ],
        "args": " --port 8002  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys",
        "scale": 1,
        "result_file": "lmsys-reqrate++/client_logs/8002_ml.json"
    },
    {
        "num_requests": "6775",
        "input_tokens": "407329",
        "output_tokens": "1169296",
        "mean_ttft": "183.29",
        "median_ttft": "184.08",
        "p99_ttft": "352.79",
        "hit_ratios": [
            "0.027944111776447105",
            "0.060072815533980584",
            "0.08",
            "0.11764705882352941",
            "0.13602015113350127",
            "0.17641441871568395",
            "0.2088098263447692",
            "0.24388422035480858",
            "0.24991751897063672",
            "0.25540664026804755",
            "0.2797193361219809",
            "0.28890481308969307",
            "0.30360753431946363",
            "0.3131039814456899",
            "0.3311403508771929",
            "0.3475250676428457",
            "0.35524525599713574",
            "0.3621045621045621",
            "0.3663735189935264",
            "0.3733255337818076",
            "0.38016026526664837",
            "0.38252868700756176",
            "0.3886172304279881",
            "0.3971105408231157",
            "0.40247805413313836",
            "0.41160365058670156",
            "0.4116658468601411",
            "0.41599557871466936",
            "0.4240827916012853",
            "0.42886991606325886",
            "0.4339706994979023",
            "0.4311373276776248",
            "0.4320371145977642",
            "0.43667714525817813",
            "0.4374342164616728",
            "0.4375329467580391",
            "0.4401687620342055",
            "0.44538413115472",
            "0.44810622090562846",
            "0.4494524227709474",
            "0.45082848074375825",
            "0.4506109731756",
            "0.45448601186306103",
            "0.4534457478005865",
            "0.4560185185185186",
            "0.46067391538378727",
            "0.4605855382156228",
            "0.4640151126260241",
            "0.46461464373858774",
            "0.46495490592442845",
            "0.46528845606241803",
            "0.4656735751295336",
            "0.4663402471634024",
            "0.46855872859083125",
            "0.46967071057192367",
            "0.4747095352564102",
            "0.47406035798979956",
            "0.473896994199332",
            "0.4723480558701396",
            "0.4724334013227023",
            "0.4724559188206478",
            "0.47166156064155706",
            "0.47084715014349654",
            "0.46974536290913343",
            "0.47153745299465477",
            "0.47069526774418247",
            "0.46871958358606874",
            "0.46871958358606874"
        ],
        "args": " --port 8003  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 9750 ",
        "size": 9750,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 1,
        "algorithm": "ml",
        "session_rate": 10,
        "request_rate": 0.02,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys",
        "scale": 2,
        "result_file": "lmsys-reqrate++/client_logs/8003_ml.json"
    },
    {
        "num_requests": "4118",
        "input_tokens": "278277",
        "output_tokens": "720395",
        "mean_ttft": "171.93",
        "median_ttft": "150.52",
        "p99_ttft": "369.03",
        "hit_ratios": [
            "0.016243654822335026",
            "0.028535193405199746",
            "0.03733602421796166",
            "0.05469356089992243",
            "0.06148222000664673",
            "0.0867224880382775",
            "0.12377049180327869",
            "0.23576567317574512",
            "0.260942760942761",
            "0.27021813325419203",
            "0.28266950845877187",
            "0.3010815211071055",
            "0.324343363188085",
            "0.34512957998212695",
            "0.3649813038530321",
            "0.37004340469359237",
            "0.38253583818812603",
            "0.38538387018648596",
            "0.3922654994736552",
            "0.39467672528289865",
            "0.38747717965165057",
            "0.3944283547096953",
            "0.39033959632067666",
            "0.3968280055879695",
            "0.40601152468462864",
            "0.41026023970429015",
            "0.4084476843910807",
            "0.40300991982606343",
            "0.4019992741908879",
            "0.4005322048026675",
            "0.39281601145453987",
            "0.3841279420639711",
            "0.38126664693696366",
            "0.377167713314513",
            "0.3696061090990765",
            "0.3634994935807945",
            "0.35803325948268966",
            "0.34881206723467795",
            "0.34346405228758176",
            "0.3434158800110174",
            "0.3434158800110174",
            "0.3434158800110174"
        ],
        "args": " --port 8001  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.005,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys",
        "scale": 0.5,
        "result_file": "lmsys-reqrate++/client_logs/8001_lru.json"
    },
    {
        "num_requests": "4001",
        "input_tokens": "288345",
        "output_tokens": "707524",
        "mean_ttft": "184.97",
        "median_ttft": "169.21",
        "p99_ttft": "466.63",
        "hit_ratios": [
            "0.01331967213114754",
            "0.0545785324439054",
            "0.05288888888888889",
            "0.053919694072657745",
            "0.053432642487046635",
            "0.05643410852713178",
            "0.11602060178910271",
            "0.18440486533449174",
            "0.21797631862217437",
            "0.24949604589858893",
            "0.25960264900662255",
            "0.28465547191661844",
            "0.2974826033565289",
            "0.313795702977761",
            "0.3224808865217765",
            "0.33468370208787784",
            "0.3270918665886483",
            "0.32725521227551085",
            "0.32123826439989844",
            "0.3202099737532808",
            "0.31932630146308266",
            "0.3187412285436683",
            "0.3182707153885743",
            "0.3178814382896015",
            "0.31820287169986095",
            "0.31391643854059137",
            "0.3082361105087391",
            "0.30426747311827945",
            "0.3058637725763343",
            "0.3005203646465041",
            "0.2939563578201759",
            "0.2842832596058933",
            "0.28095953095953097",
            "0.27270231313061977",
            "0.2663844256283752",
            "0.2616126630628297",
            "0.25586293618359013",
            "0.2526520891967958",
            "0.2525502318392581",
            "0.2525502318392581",
            "0.2525502318392581"
        ],
        "args": " --port 8000  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.0025,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys",
        "scale": 0.25,
        "result_file": "lmsys-reqrate++/client_logs/8000_lru.json"
    },
    {
        "num_requests": "5023",
        "input_tokens": "313881",
        "output_tokens": "869457",
        "mean_ttft": "169.12",
        "median_ttft": "149.78",
        "p99_ttft": "353.21",
        "hit_ratios": [
            "0.03933136676499509",
            "0.061626429479034316",
            "0.07114427860696518",
            "0.09221689413500554",
            "0.11855203619909502",
            "0.12951969778737182",
            "0.15708908406524466",
            "0.1977604056623706",
            "0.26144438935713105",
            "0.29188107489994286",
            "0.31492687846696926",
            "0.33100574389007775",
            "0.33999204929437493",
            "0.3428956834532375",
            "0.35076948264571056",
            "0.3531064864043749",
            "0.3654601861427094",
            "0.38162723016575983",
            "0.3786384837928795",
            "0.3781255220805257",
            "0.3786556666137818",
            "0.3771994314561583",
            "0.38449882914734373",
            "0.3892585551330797",
            "0.39979321753515296",
            "0.4068922886725389",
            "0.4084132249480552",
            "0.4132076779155983",
            "0.4188882207523217",
            "0.4206015472025165",
            "0.4224740263685521",
            "0.4219636363636362",
            "0.42268618286641846",
            "0.42354849863028265",
            "0.42445261141881047",
            "0.4267972712961342",
            "0.42855420524691346",
            "0.42482781394471164",
            "0.4236848688848961",
            "0.4211586019740441",
            "0.42370357765771893",
            "0.4245864350703061",
            "0.4239416932907349",
            "0.42349919617299925",
            "0.42261116548640293",
            "0.4215604975499434",
            "0.4177694456697544",
            "0.4151808820117434",
            "0.41068729126384246",
            "0.41068729126384246",
            "0.41068729126384246"
        ],
        "args": " --port 8002  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.01,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys",
        "scale": 1,
        "result_file": "lmsys-reqrate++/client_logs/8002_lru.json"
    },
    {
        "num_requests": "6758",
        "input_tokens": "406972",
        "output_tokens": "1195231",
        "mean_ttft": "182.24",
        "median_ttft": "181.97",
        "p99_ttft": "345.63",
        "hit_ratios": [
            "0.02721774193548387",
            "0.05953827460510329",
            "0.07864164432529043",
            "0.11145725164416753",
            "0.13029960429621254",
            "0.1677917068466731",
            "0.192847740236946",
            "0.21858440575321728",
            "0.22156084656084654",
            "0.22482758620689652",
            "0.24553571428571427",
            "0.2501512035805008",
            "0.27070270270270264",
            "0.27246860282574564",
            "0.2883612160460514",
            "0.30765507784141327",
            "0.3198014018691589",
            "0.32728014690879415",
            "0.3311907139291064",
            "0.34076812977099236",
            "0.3458378194593983",
            "0.35193899075125745",
            "0.3572497806225159",
            "0.3623464944468907",
            "0.366872263289232",
            "0.377835443604313",
            "0.3822623517995021",
            "0.38715693031175247",
            "0.3939032828476974",
            "0.39968176435760805",
            "0.4014918513804928",
            "0.39687468013238253",
            "0.3924652523774689",
            "0.39395592056719386",
            "0.39838759689922476",
            "0.39880539382786806",
            "0.39997665392359993",
            "0.4057579086734837",
            "0.40862120675082475",
            "0.4116487789288663",
            "0.41344741385975314",
            "0.4138580068763018",
            "0.4180604424736107",
            "0.4166529149673496",
            "0.4211274386190138",
            "0.42491941758363894",
            "0.4256359015574429",
            "0.4283267429320589",
            "0.43020196789228377",
            "0.42981064637256267",
            "0.4331901202597453",
            "0.432961320898945",
            "0.43324565821627764",
            "0.43670863047591313",
            "0.43886682552290174",
            "0.4427087818404146",
            "0.44128997617369703",
            "0.44143519664636655",
            "0.4414877238473381",
            "0.44200098586398245",
            "0.4403024799599197",
            "0.43986856177441597",
            "0.43963480128893656",
            "0.43967536687472597",
            "0.4403001708893676",
            "0.4390415475928775",
            "0.4376933854866016",
            "0.4376933854866016"
        ],
        "args": " --port 8003  --eviction_algorithm ml --max-num-batched-tokens 2048 --num-gpu-blocks-override 10000 ",
        "size": 10000,
        "num_prompts": 30000,
        "use_oracle": 0,
        "use_token_id": 0,
        "algorithm": "lru",
        "session_rate": 10,
        "request_rate": 0.02,
        "max_active_conversations": 200,
        "checkpoint": "/home/dy5/vllm/benchmarks/checkpoints_lmsys-chat-1m_20/lmsys-chat-1m_epoch11_metric_0_5797.pt",
        "dataset_file": "\"lmsys/lmsys-chat-1m\"",
        "time_limit": 1200,
        "dataset_name": "lmsys",
        "scale": 2,
        "result_file": "lmsys-reqrate++/client_logs/8003_lru.json"
    }
]