task,score,model,method
2wikimqa,32.43,Qwen1.5-7B-Chat-AWQ,baseline
dureader,25.84,Qwen1.5-7B-Chat-AWQ,baseline
gov_report,16.98,Qwen1.5-7B-Chat-AWQ,baseline
hotpotqa,47.77,Qwen1.5-7B-Chat-AWQ,baseline
lcc,57.98,Qwen1.5-7B-Chat-AWQ,baseline
lsht,29,Qwen1.5-7B-Chat-AWQ,baseline
multifieldqa_en,46.72,Qwen1.5-7B-Chat-AWQ,baseline
multifieldqa_zh,50.97,Qwen1.5-7B-Chat-AWQ,baseline
multi_news,14.97,Qwen1.5-7B-Chat-AWQ,baseline
musique,26.18,Qwen1.5-7B-Chat-AWQ,baseline
narrativeqa,20.93,Qwen1.5-7B-Chat-AWQ,baseline
passage_count,0.5,Qwen1.5-7B-Chat-AWQ,baseline
passage_retrieval_en,30.5,Qwen1.5-7B-Chat-AWQ,baseline
passage_retrieval_zh,48.5,Qwen1.5-7B-Chat-AWQ,baseline
qasper,38.45,Qwen1.5-7B-Chat-AWQ,baseline
qmsum,17.85,Qwen1.5-7B-Chat-AWQ,baseline
repobench-p,46.95,Qwen1.5-7B-Chat-AWQ,baseline
samsum,31.98,Qwen1.5-7B-Chat-AWQ,baseline
trec,67,Qwen1.5-7B-Chat-AWQ,baseline
triviaqa,87.56,Qwen1.5-7B-Chat-AWQ,baseline
vcsum,18.66,Qwen1.5-7B-Chat-AWQ,baseline
2wikimqa,30.82,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
dureader,23.1,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
gov_report,16.31,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
hotpotqa,47.17,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
lcc,44.56,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
lsht,25.5,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
multifieldqa_en,42.87,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
multifieldqa_zh,45.51,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
multi_news,15.04,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
musique,23.23,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
narrativeqa,19.58,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
passage_count,0,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
passage_retrieval_en,16,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
passage_retrieval_zh,14,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
qasper,35.27,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
qmsum,17.34,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
repobench-p,25.02,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
samsum,28.3,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
trec,65,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
triviaqa,86.48,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
vcsum,19.95,Qwen1.5-7B-Chat-AWQ,KiVi_2_128
2wikimqa,30.82,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
dureader,23.1,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
gov_report,16.3,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
hotpotqa,47.17,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
lcc,44.56,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
lsht,25.5,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
multifieldqa_en,42.87,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
multifieldqa_zh,45.51,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
multi_news,15.2,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
musique,23.23,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
narrativeqa,19.58,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
passage_count,0,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
passage_retrieval_en,16,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
passage_retrieval_zh,14,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
qasper,35.27,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
qmsum,17.33,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
repobench-p,25.02,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
samsum,28.3,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
trec,65,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
triviaqa,86.48,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
vcsum,19.97,Qwen1.5-7B-Chat-AWQ,KiVi_2_192
2wikimqa,30.82,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
dureader,23.1,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
gov_report,16.31,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
hotpotqa,47.17,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
lcc,44.56,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
lsht,25.5,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
multifieldqa_en,42.87,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
multifieldqa_zh,45.51,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
multi_news,15.08,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
musique,23.23,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
narrativeqa,19.58,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
passage_count,0,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
passage_retrieval_en,16,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
passage_retrieval_zh,14,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
qasper,35.27,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
qmsum,17.33,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
repobench-p,25.02,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
samsum,28.3,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
trec,65,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
triviaqa,86.48,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
vcsum,19.97,Qwen1.5-7B-Chat-AWQ,KiVi_2_256
2wikimqa,33.46,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
dureader,24.36,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
gov_report,16.65,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
hotpotqa,46,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
lcc,52.33,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
lsht,27,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
multifieldqa_en,45.85,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
multifieldqa_zh,46.73,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
multi_news,15.16,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
musique,24.36,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
narrativeqa,20.14,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
passage_count,0,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
passage_retrieval_en,18.5,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
passage_retrieval_zh,22,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
qasper,36.16,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
qmsum,17.77,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
repobench-p,29.03,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
samsum,32.06,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
trec,63.5,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
triviaqa,87.61,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
vcsum,19.96,Qwen1.5-7B-Chat-AWQ,LogQuant_2_128
2wikimqa,33.41,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
dureader,24.09,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
gov_report,16.53,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
hotpotqa,45.48,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
lcc,53.43,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
lsht,27.5,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
multifieldqa_en,45.94,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
multifieldqa_zh,47.29,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
multi_news,15.01,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
musique,23.73,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
narrativeqa,20.18,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
passage_count,0,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
passage_retrieval_en,17.5,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
passage_retrieval_zh,24.5,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
qasper,36.33,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
qmsum,17.76,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
repobench-p,30.33,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
samsum,32.34,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
trec,63.5,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
triviaqa,87.81,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
vcsum,19.98,Qwen1.5-7B-Chat-AWQ,LogQuant_2_192
2wikimqa,33.39,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
dureader,24.3,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
gov_report,16.66,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
hotpotqa,45.26,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
lcc,54.24,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
lsht,27,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
multifieldqa_en,45.6,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
multifieldqa_zh,46.97,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
multi_news,14.94,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
musique,23.89,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
narrativeqa,20.36,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
passage_count,0,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
passage_retrieval_en,18,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
passage_retrieval_zh,24.5,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
qasper,36.31,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
qmsum,17.75,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
repobench-p,29.9,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
samsum,32.42,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
trec,63,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
triviaqa,87.88,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
vcsum,19.95,Qwen1.5-7B-Chat-AWQ,LogQuant_2_256
2wikimqa,32.94,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
dureader,24.06,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
gov_report,16.7,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
hotpotqa,46.33,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
lcc,54.32,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
lsht,27,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
multifieldqa_en,45.93,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
multifieldqa_zh,47.13,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
multi_news,15.08,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
musique,23.9,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
narrativeqa,19.94,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
passage_count,0,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
passage_retrieval_en,17,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
passage_retrieval_zh,24,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
qasper,36.2,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
qmsum,17.58,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
repobench-p,31.91,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
samsum,31.39,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
trec,64,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
triviaqa,87.48,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
vcsum,19.91,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_128
2wikimqa,33.44,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
dureader,24.7,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
gov_report,16.63,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
hotpotqa,45.11,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
lcc,53.65,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
lsht,27,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
multifieldqa_en,45.64,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
multifieldqa_zh,46.61,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
multi_news,15.16,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
musique,23.79,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
narrativeqa,19.85,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
passage_count,0,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
passage_retrieval_en,20,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
passage_retrieval_zh,23,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
qasper,36.57,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
qmsum,17.49,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
repobench-p,31.81,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
samsum,31.81,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
trec,63.5,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
triviaqa,87.48,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
vcsum,19.89,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_192
2wikimqa,33.4,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
dureader,24.12,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
gov_report,16.68,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
hotpotqa,45.83,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
lcc,54.23,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
lsht,27.5,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
multifieldqa_en,46.24,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
multifieldqa_zh,46.92,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
multi_news,15.04,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
musique,23.89,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
narrativeqa,19.84,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
passage_count,0,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
passage_retrieval_en,19,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
passage_retrieval_zh,26.5,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
qasper,36.71,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
qmsum,17.67,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
repobench-p,34.31,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
samsum,32.2,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
trec,64,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
triviaqa,87.39,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
vcsum,19.97,Qwen1.5-7B-Chat-AWQ,PartialLogQuant_2_256
