{"meta-llama/Llama-2-7b-chat-hf": {"original": 6.9423699378967285, "qbit-16-heavy-2048-group-1-qk": 6.9423699378967285, "qbit-8-heavy-2048-group-1-qk": 6.9423699378967285, "qbit-4-heavy-2048-group-1-qk": 6.9423699378967285, "qbit-4-heavy-2048-group-2-qk": 6.9423699378967285, "qbit-4-heavy-2048-group-4-qk": 6.9423699378967285, "qbit-4-heavy-2048-group-8-qk": 6.9423699378967285, "qbit-4-heavy-2048-group-16-qk": 6.9423699378967285, "qbit-4-heavy-2048-group-32-qk": 6.9423699378967285, "qbit-16-heavy-1024-group-1-qk": 6.9394707679748535, "qbit-8-heavy-1024-group-1-qk": 6.939413070678711, "qbit-4-heavy-1024-group-1-qk": 6.938732147216797, "qbit-4-heavy-1024-group-2-qk": 6.934878826141357, "qbit-4-heavy-1024-group-4-qk": 6.934546947479248, "qbit-4-heavy-1024-group-8-qk": 6.962414741516113, "qbit-4-heavy-1024-group-16-qk": NaN, "qbit-4-heavy-1024-group-32-qk": 8.262508392333984, "qbit-16-heavy-512-group-1-qk": 6.9667067527771, "qbit-8-heavy-512-group-1-qk": 6.966775417327881, "qbit-4-heavy-512-group-1-qk": 6.964434623718262, "qbit-4-heavy-512-group-2-qk": 6.913018226623535, "qbit-4-heavy-512-group-4-qk": 6.919395923614502, "qbit-4-heavy-512-group-8-qk": 7.093745708465576, "qbit-4-heavy-512-group-16-qk": NaN, "qbit-4-heavy-512-group-32-qk": NaN, "qbit-16-heavy-256-group-1-qk": 7.194601058959961, "qbit-8-heavy-256-group-1-qk": 7.194504737854004, "qbit-4-heavy-256-group-1-qk": 7.193200588226318, "qbit-4-heavy-256-group-2-qk": 6.919350624084473, "qbit-4-heavy-256-group-4-qk": 6.980145454406738, "qbit-4-heavy-256-group-8-qk": 7.566158294677734, "qbit-4-heavy-256-group-16-qk": NaN, "qbit-4-heavy-256-group-32-qk": NaN, "qbit-16-heavy-128-group-1-qk": 8.334566116333008, "qbit-8-heavy-128-group-1-qk": 8.335561752319336, "qbit-4-heavy-128-group-1-qk": 8.33909797668457, "qbit-4-heavy-128-group-2-qk": 7.022818565368652, "qbit-4-heavy-128-group-4-qk": 7.144011497497559, "qbit-4-heavy-128-group-8-qk": 8.889999389648438, "qbit-4-heavy-128-group-16-qk": NaN, "qbit-4-heavy-128-group-32-qk": NaN, "qbit-16-heavy-64-group-1-qk": 11.920303344726562, "qbit-8-heavy-64-group-1-qk": 11.920411109924316, "qbit-4-heavy-64-group-1-qk": 11.959208488464355, "qbit-4-heavy-64-group-2-qk": 7.692116737365723, "qbit-4-heavy-64-group-4-qk": 8.11898136138916, "qbit-4-heavy-64-group-8-qk": 14.934636116027832, "qbit-4-heavy-64-group-16-qk": NaN, "qbit-4-heavy-64-group-32-qk": NaN, "qbit-16-heavy-32-group-1-qk": 40.48686599731445, "qbit-8-heavy-32-group-1-qk": 40.467159271240234, "qbit-4-heavy-32-group-1-qk": 40.79131317138672, "qbit-4-heavy-32-group-2-qk": 8.623040199279785, "qbit-4-heavy-32-group-4-qk": 11.947843551635742, "qbit-4-heavy-32-group-8-qk": 57.14908218383789, "qbit-4-heavy-32-group-16-qk": NaN, "qbit-4-heavy-32-group-32-qk": NaN, "qbit-16-heavy-16-group-1-qk": 444.2059020996094, "qbit-8-heavy-16-group-1-qk": 445.8756103515625, "qbit-4-heavy-16-group-1-qk": 423.16510009765625, "qbit-4-heavy-16-group-2-qk": 10.453869819641113, "qbit-4-heavy-16-group-4-qk": 42.02849197387695, "qbit-4-heavy-16-group-8-qk": 655.7816772460938, "qbit-4-heavy-16-group-16-qk": NaN, "qbit-4-heavy-16-group-32-qk": NaN}, "meta-llama/Llama-2-7b-hf": {"original": 5.472101211547852, "qbit-16-heavy-2048-group-1-qk": 5.472101211547852, "qbit-8-heavy-2048-group-1-qk": 5.472101211547852, "qbit-4-heavy-2048-group-1-qk": 5.472101211547852, "qbit-4-heavy-2048-group-2-qk": 5.472101211547852, "qbit-4-heavy-2048-group-4-qk": 5.472101211547852, "qbit-4-heavy-2048-group-8-qk": 5.472101211547852, "qbit-4-heavy-2048-group-16-qk": 5.472101211547852, "qbit-4-heavy-2048-group-32-qk": 5.472101211547852, "qbit-16-heavy-1024-group-1-qk": 5.476795673370361, "qbit-8-heavy-1024-group-1-qk": 5.47688102722168, "qbit-4-heavy-1024-group-1-qk": 5.4766845703125, "qbit-4-heavy-1024-group-2-qk": 5.475284099578857, "qbit-4-heavy-1024-group-4-qk": 5.474892616271973, "qbit-4-heavy-1024-group-8-qk": 5.4919915199279785, "qbit-4-heavy-1024-group-16-qk": 5.781702041625977, "qbit-4-heavy-1024-group-32-qk": 6.405287742614746, "qbit-16-heavy-512-group-1-qk": 5.531502723693848, "qbit-8-heavy-512-group-1-qk": 5.5313825607299805, "qbit-4-heavy-512-group-1-qk": 5.531477928161621, "qbit-4-heavy-512-group-2-qk": 5.500298023223877, "qbit-4-heavy-512-group-4-qk": 5.502518177032471, "qbit-4-heavy-512-group-8-qk": 5.637580394744873, "qbit-4-heavy-512-group-16-qk": NaN, "qbit-4-heavy-512-group-32-qk": NaN, "qbit-16-heavy-256-group-1-qk": 5.6699371337890625, "qbit-8-heavy-256-group-1-qk": 5.669694900512695, "qbit-4-heavy-256-group-1-qk": 5.67064905166626, "qbit-4-heavy-256-group-2-qk": 5.563470840454102, "qbit-4-heavy-256-group-4-qk": 5.600241184234619, "qbit-4-heavy-256-group-8-qk": 6.085517406463623, "qbit-4-heavy-256-group-16-qk": NaN, "qbit-4-heavy-256-group-32-qk": NaN, "qbit-16-heavy-128-group-1-qk": 6.3136982917785645, "qbit-8-heavy-128-group-1-qk": 6.313942909240723, "qbit-4-heavy-128-group-1-qk": 6.314574241638184, "qbit-4-heavy-128-group-2-qk": 5.7002105712890625, "qbit-4-heavy-128-group-4-qk": 5.760659694671631, "qbit-4-heavy-128-group-8-qk": 7.278022289276123, "qbit-4-heavy-128-group-16-qk": NaN, "qbit-4-heavy-128-group-32-qk": NaN, "qbit-16-heavy-64-group-1-qk": 8.987100601196289, "qbit-8-heavy-64-group-1-qk": 8.986494064331055, "qbit-4-heavy-64-group-1-qk": 9.023778915405273, "qbit-4-heavy-64-group-2-qk": 6.181826114654541, "qbit-4-heavy-64-group-4-qk": 6.306554794311523, "qbit-4-heavy-64-group-8-qk": 12.007704734802246, "qbit-4-heavy-64-group-16-qk": NaN, "qbit-4-heavy-64-group-32-qk": NaN, "qbit-16-heavy-32-group-1-qk": 36.77484893798828, "qbit-8-heavy-32-group-1-qk": 36.74520492553711, "qbit-4-heavy-32-group-1-qk": 36.21088409423828, "qbit-4-heavy-32-group-2-qk": 6.922602653503418, "qbit-4-heavy-32-group-4-qk": 8.510836601257324, "qbit-4-heavy-32-group-8-qk": 49.451229095458984, "qbit-4-heavy-32-group-16-qk": NaN, "qbit-4-heavy-32-group-32-qk": NaN, "qbit-16-heavy-16-group-1-qk": 595.1775512695312, "qbit-8-heavy-16-group-1-qk": 591.9359741210938, "qbit-4-heavy-16-group-1-qk": 538.2896728515625, "qbit-4-heavy-16-group-2-qk": 7.7085185050964355, "qbit-4-heavy-16-group-4-qk": 28.65460777282715, "qbit-4-heavy-16-group-8-qk": 478.9056091308594, "qbit-4-heavy-16-group-16-qk": NaN, "qbit-4-heavy-16-group-32-qk": NaN}}