task,score,model,method
2wikimqa,44.81,Qwen1.5-14B-Chat,baseline
dureader,26.02,Qwen1.5-14B-Chat,baseline
gov_report,16.31,Qwen1.5-14B-Chat,baseline
hotpotqa,55.67,Qwen1.5-14B-Chat,baseline
lcc,56.69,Qwen1.5-14B-Chat,baseline
lsht,37,Qwen1.5-14B-Chat,baseline
multifieldqa_en,48.36,Qwen1.5-14B-Chat,baseline
multifieldqa_zh,60.35,Qwen1.5-14B-Chat,baseline
multi_news,14.95,Qwen1.5-14B-Chat,baseline
musique,32.38,Qwen1.5-14B-Chat,baseline
narrativeqa,22.26,Qwen1.5-14B-Chat,baseline
passage_count,1,Qwen1.5-14B-Chat,baseline
passage_retrieval_en,94.5,Qwen1.5-14B-Chat,baseline
passage_retrieval_zh,88.5,Qwen1.5-14B-Chat,baseline
qasper,38.93,Qwen1.5-14B-Chat,baseline
qmsum,18.16,Qwen1.5-14B-Chat,baseline
repobench-p,58.25,Qwen1.5-14B-Chat,baseline
samsum,32.95,Qwen1.5-14B-Chat,baseline
trec,77.5,Qwen1.5-14B-Chat,baseline
triviaqa,88.63,Qwen1.5-14B-Chat,baseline
vcsum,19.41,Qwen1.5-14B-Chat,baseline
2wikimqa,40.31,Qwen1.5-14B-Chat,KiVi_2_128
dureader,24.66,Qwen1.5-14B-Chat,KiVi_2_128
gov_report,15.81,Qwen1.5-14B-Chat,KiVi_2_128
hotpotqa,54.23,Qwen1.5-14B-Chat,KiVi_2_128
lcc,41.24,Qwen1.5-14B-Chat,KiVi_2_128
lsht,34,Qwen1.5-14B-Chat,KiVi_2_128
multifieldqa_en,46.25,Qwen1.5-14B-Chat,KiVi_2_128
multifieldqa_zh,58.87,Qwen1.5-14B-Chat,KiVi_2_128
multi_news,15.11,Qwen1.5-14B-Chat,KiVi_2_128
musique,30.58,Qwen1.5-14B-Chat,KiVi_2_128
narrativeqa,22.32,Qwen1.5-14B-Chat,KiVi_2_128
passage_count,2.5,Qwen1.5-14B-Chat,KiVi_2_128
passage_retrieval_en,70.5,Qwen1.5-14B-Chat,KiVi_2_128
passage_retrieval_zh,70,Qwen1.5-14B-Chat,KiVi_2_128
qasper,38.02,Qwen1.5-14B-Chat,KiVi_2_128
qmsum,17.74,Qwen1.5-14B-Chat,KiVi_2_128
repobench-p,43.45,Qwen1.5-14B-Chat,KiVi_2_128
samsum,30.79,Qwen1.5-14B-Chat,KiVi_2_128
trec,78,Qwen1.5-14B-Chat,KiVi_2_128
triviaqa,87.65,Qwen1.5-14B-Chat,KiVi_2_128
vcsum,19.34,Qwen1.5-14B-Chat,KiVi_2_128
2wikimqa,40.31,Qwen1.5-14B-Chat,KiVi_2_192
dureader,24.66,Qwen1.5-14B-Chat,KiVi_2_192
gov_report,15.9,Qwen1.5-14B-Chat,KiVi_2_192
hotpotqa,54.23,Qwen1.5-14B-Chat,KiVi_2_192
lcc,41.24,Qwen1.5-14B-Chat,KiVi_2_192
lsht,34,Qwen1.5-14B-Chat,KiVi_2_192
multifieldqa_en,46.25,Qwen1.5-14B-Chat,KiVi_2_192
multifieldqa_zh,58.87,Qwen1.5-14B-Chat,KiVi_2_192
multi_news,14.97,Qwen1.5-14B-Chat,KiVi_2_192
musique,30.58,Qwen1.5-14B-Chat,KiVi_2_192
narrativeqa,22.32,Qwen1.5-14B-Chat,KiVi_2_192
passage_count,2.5,Qwen1.5-14B-Chat,KiVi_2_192
passage_retrieval_en,70.5,Qwen1.5-14B-Chat,KiVi_2_192
passage_retrieval_zh,70,Qwen1.5-14B-Chat,KiVi_2_192
qasper,38.02,Qwen1.5-14B-Chat,KiVi_2_192
qmsum,17.73,Qwen1.5-14B-Chat,KiVi_2_192
repobench-p,43.45,Qwen1.5-14B-Chat,KiVi_2_192
samsum,30.79,Qwen1.5-14B-Chat,KiVi_2_192
trec,78,Qwen1.5-14B-Chat,KiVi_2_192
triviaqa,87.65,Qwen1.5-14B-Chat,KiVi_2_192
vcsum,19.39,Qwen1.5-14B-Chat,KiVi_2_192
2wikimqa,40.31,Qwen1.5-14B-Chat,KiVi_2_256
dureader,24.66,Qwen1.5-14B-Chat,KiVi_2_256
gov_report,15.77,Qwen1.5-14B-Chat,KiVi_2_256
hotpotqa,54.23,Qwen1.5-14B-Chat,KiVi_2_256
lcc,41.24,Qwen1.5-14B-Chat,KiVi_2_256
lsht,34,Qwen1.5-14B-Chat,KiVi_2_256
multifieldqa_en,46.25,Qwen1.5-14B-Chat,KiVi_2_256
multifieldqa_zh,58.87,Qwen1.5-14B-Chat,KiVi_2_256
multi_news,15,Qwen1.5-14B-Chat,KiVi_2_256
musique,30.58,Qwen1.5-14B-Chat,KiVi_2_256
narrativeqa,22.32,Qwen1.5-14B-Chat,KiVi_2_256
passage_count,2.5,Qwen1.5-14B-Chat,KiVi_2_256
passage_retrieval_en,70.5,Qwen1.5-14B-Chat,KiVi_2_256
passage_retrieval_zh,70,Qwen1.5-14B-Chat,KiVi_2_256
qasper,38.02,Qwen1.5-14B-Chat,KiVi_2_256
qmsum,17.73,Qwen1.5-14B-Chat,KiVi_2_256
repobench-p,43.45,Qwen1.5-14B-Chat,KiVi_2_256
samsum,30.79,Qwen1.5-14B-Chat,KiVi_2_256
trec,78,Qwen1.5-14B-Chat,KiVi_2_256
triviaqa,87.65,Qwen1.5-14B-Chat,KiVi_2_256
vcsum,19.42,Qwen1.5-14B-Chat,KiVi_2_256
2wikimqa,42.17,Qwen1.5-14B-Chat,LogQuant_2_128
dureader,24.33,Qwen1.5-14B-Chat,LogQuant_2_128
gov_report,16.08,Qwen1.5-14B-Chat,LogQuant_2_128
hotpotqa,55.46,Qwen1.5-14B-Chat,LogQuant_2_128
lcc,50.73,Qwen1.5-14B-Chat,LogQuant_2_128
lsht,35.5,Qwen1.5-14B-Chat,LogQuant_2_128
multifieldqa_en,47.04,Qwen1.5-14B-Chat,LogQuant_2_128
multifieldqa_zh,60.2,Qwen1.5-14B-Chat,LogQuant_2_128
multi_news,14.84,Qwen1.5-14B-Chat,LogQuant_2_128
musique,29.95,Qwen1.5-14B-Chat,LogQuant_2_128
narrativeqa,22.08,Qwen1.5-14B-Chat,LogQuant_2_128
passage_count,1,Qwen1.5-14B-Chat,LogQuant_2_128
passage_retrieval_en,79.5,Qwen1.5-14B-Chat,LogQuant_2_128
passage_retrieval_zh,81,Qwen1.5-14B-Chat,LogQuant_2_128
qasper,39.26,Qwen1.5-14B-Chat,LogQuant_2_128
qmsum,18.01,Qwen1.5-14B-Chat,LogQuant_2_128
repobench-p,50.93,Qwen1.5-14B-Chat,LogQuant_2_128
samsum,32.37,Qwen1.5-14B-Chat,LogQuant_2_128
trec,78.5,Qwen1.5-14B-Chat,LogQuant_2_128
triviaqa,88.97,Qwen1.5-14B-Chat,LogQuant_2_128
vcsum,19.3,Qwen1.5-14B-Chat,LogQuant_2_128
2wikimqa,42.3,Qwen1.5-14B-Chat,LogQuant_2_192
dureader,24.17,Qwen1.5-14B-Chat,LogQuant_2_192
gov_report,16.07,Qwen1.5-14B-Chat,LogQuant_2_192
hotpotqa,55.54,Qwen1.5-14B-Chat,LogQuant_2_192
lcc,50.09,Qwen1.5-14B-Chat,LogQuant_2_192
lsht,35.5,Qwen1.5-14B-Chat,LogQuant_2_192
multifieldqa_en,46.94,Qwen1.5-14B-Chat,LogQuant_2_192
multifieldqa_zh,60.09,Qwen1.5-14B-Chat,LogQuant_2_192
multi_news,15.01,Qwen1.5-14B-Chat,LogQuant_2_192
musique,29.87,Qwen1.5-14B-Chat,LogQuant_2_192
narrativeqa,22.04,Qwen1.5-14B-Chat,LogQuant_2_192
passage_count,1,Qwen1.5-14B-Chat,LogQuant_2_192
passage_retrieval_en,81,Qwen1.5-14B-Chat,LogQuant_2_192
passage_retrieval_zh,80,Qwen1.5-14B-Chat,LogQuant_2_192
qasper,39.49,Qwen1.5-14B-Chat,LogQuant_2_192
qmsum,18.04,Qwen1.5-14B-Chat,LogQuant_2_192
repobench-p,52.07,Qwen1.5-14B-Chat,LogQuant_2_192
samsum,32.57,Qwen1.5-14B-Chat,LogQuant_2_192
trec,78.5,Qwen1.5-14B-Chat,LogQuant_2_192
triviaqa,89.14,Qwen1.5-14B-Chat,LogQuant_2_192
vcsum,19.42,Qwen1.5-14B-Chat,LogQuant_2_192
2wikimqa,42.17,Qwen1.5-14B-Chat,LogQuant_2_256
dureader,24,Qwen1.5-14B-Chat,LogQuant_2_256
gov_report,16,Qwen1.5-14B-Chat,LogQuant_2_256
hotpotqa,55.56,Qwen1.5-14B-Chat,LogQuant_2_256
lcc,49.45,Qwen1.5-14B-Chat,LogQuant_2_256
lsht,36,Qwen1.5-14B-Chat,LogQuant_2_256
multifieldqa_en,46.72,Qwen1.5-14B-Chat,LogQuant_2_256
multifieldqa_zh,60.63,Qwen1.5-14B-Chat,LogQuant_2_256
multi_news,14.93,Qwen1.5-14B-Chat,LogQuant_2_256
musique,29.26,Qwen1.5-14B-Chat,LogQuant_2_256
narrativeqa,22.08,Qwen1.5-14B-Chat,LogQuant_2_256
passage_count,2,Qwen1.5-14B-Chat,LogQuant_2_256
passage_retrieval_en,78.5,Qwen1.5-14B-Chat,LogQuant_2_256
passage_retrieval_zh,81.5,Qwen1.5-14B-Chat,LogQuant_2_256
qasper,39,Qwen1.5-14B-Chat,LogQuant_2_256
qmsum,18.11,Qwen1.5-14B-Chat,LogQuant_2_256
repobench-p,52.28,Qwen1.5-14B-Chat,LogQuant_2_256
samsum,32.48,Qwen1.5-14B-Chat,LogQuant_2_256
trec,78.5,Qwen1.5-14B-Chat,LogQuant_2_256
triviaqa,89.14,Qwen1.5-14B-Chat,LogQuant_2_256
vcsum,19.17,Qwen1.5-14B-Chat,LogQuant_2_256
2wikimqa,42.28,Qwen1.5-14B-Chat,PartialLogQuant_2_128
dureader,24.63,Qwen1.5-14B-Chat,PartialLogQuant_2_128
gov_report,16.01,Qwen1.5-14B-Chat,PartialLogQuant_2_128
hotpotqa,55.72,Qwen1.5-14B-Chat,PartialLogQuant_2_128
lcc,50.21,Qwen1.5-14B-Chat,PartialLogQuant_2_128
lsht,35.5,Qwen1.5-14B-Chat,PartialLogQuant_2_128
multifieldqa_en,47.16,Qwen1.5-14B-Chat,PartialLogQuant_2_128
multifieldqa_zh,60.08,Qwen1.5-14B-Chat,PartialLogQuant_2_128
multi_news,14.82,Qwen1.5-14B-Chat,PartialLogQuant_2_128
musique,30.22,Qwen1.5-14B-Chat,PartialLogQuant_2_128
narrativeqa,21.92,Qwen1.5-14B-Chat,PartialLogQuant_2_128
passage_count,1.5,Qwen1.5-14B-Chat,PartialLogQuant_2_128
passage_retrieval_en,80.5,Qwen1.5-14B-Chat,PartialLogQuant_2_128
passage_retrieval_zh,80.5,Qwen1.5-14B-Chat,PartialLogQuant_2_128
qasper,39.5,Qwen1.5-14B-Chat,PartialLogQuant_2_128
qmsum,18.31,Qwen1.5-14B-Chat,PartialLogQuant_2_128
repobench-p,51.84,Qwen1.5-14B-Chat,PartialLogQuant_2_128
samsum,32.71,Qwen1.5-14B-Chat,PartialLogQuant_2_128
trec,78.5,Qwen1.5-14B-Chat,PartialLogQuant_2_128
triviaqa,89.14,Qwen1.5-14B-Chat,PartialLogQuant_2_128
vcsum,19.23,Qwen1.5-14B-Chat,PartialLogQuant_2_128
2wikimqa,42.17,Qwen1.5-14B-Chat,PartialLogQuant_2_192
dureader,24.41,Qwen1.5-14B-Chat,PartialLogQuant_2_192
gov_report,15.98,Qwen1.5-14B-Chat,PartialLogQuant_2_192
hotpotqa,55.57,Qwen1.5-14B-Chat,PartialLogQuant_2_192
lcc,50.13,Qwen1.5-14B-Chat,PartialLogQuant_2_192
lsht,35.5,Qwen1.5-14B-Chat,PartialLogQuant_2_192
multifieldqa_en,46.52,Qwen1.5-14B-Chat,PartialLogQuant_2_192
multifieldqa_zh,60.4,Qwen1.5-14B-Chat,PartialLogQuant_2_192
multi_news,14.8,Qwen1.5-14B-Chat,PartialLogQuant_2_192
musique,30.36,Qwen1.5-14B-Chat,PartialLogQuant_2_192
narrativeqa,21.87,Qwen1.5-14B-Chat,PartialLogQuant_2_192
passage_count,1.5,Qwen1.5-14B-Chat,PartialLogQuant_2_192
passage_retrieval_en,81.5,Qwen1.5-14B-Chat,PartialLogQuant_2_192
passage_retrieval_zh,80.5,Qwen1.5-14B-Chat,PartialLogQuant_2_192
qasper,39.41,Qwen1.5-14B-Chat,PartialLogQuant_2_192
qmsum,17.78,Qwen1.5-14B-Chat,PartialLogQuant_2_192
repobench-p,52.61,Qwen1.5-14B-Chat,PartialLogQuant_2_192
samsum,32.31,Qwen1.5-14B-Chat,PartialLogQuant_2_192
trec,78.5,Qwen1.5-14B-Chat,PartialLogQuant_2_192
triviaqa,89.14,Qwen1.5-14B-Chat,PartialLogQuant_2_192
vcsum,19.4,Qwen1.5-14B-Chat,PartialLogQuant_2_192
2wikimqa,42.28,Qwen1.5-14B-Chat,PartialLogQuant_2_256
dureader,24.45,Qwen1.5-14B-Chat,PartialLogQuant_2_256
gov_report,15.92,Qwen1.5-14B-Chat,PartialLogQuant_2_256
hotpotqa,55.03,Qwen1.5-14B-Chat,PartialLogQuant_2_256
lcc,50.28,Qwen1.5-14B-Chat,PartialLogQuant_2_256
lsht,35.5,Qwen1.5-14B-Chat,PartialLogQuant_2_256
multifieldqa_en,47.18,Qwen1.5-14B-Chat,PartialLogQuant_2_256
multifieldqa_zh,60.31,Qwen1.5-14B-Chat,PartialLogQuant_2_256
multi_news,14.84,Qwen1.5-14B-Chat,PartialLogQuant_2_256
musique,30.15,Qwen1.5-14B-Chat,PartialLogQuant_2_256
narrativeqa,21.94,Qwen1.5-14B-Chat,PartialLogQuant_2_256
passage_count,1.5,Qwen1.5-14B-Chat,PartialLogQuant_2_256
passage_retrieval_en,83,Qwen1.5-14B-Chat,PartialLogQuant_2_256
passage_retrieval_zh,82.5,Qwen1.5-14B-Chat,PartialLogQuant_2_256
qasper,39.76,Qwen1.5-14B-Chat,PartialLogQuant_2_256
qmsum,18.19,Qwen1.5-14B-Chat,PartialLogQuant_2_256
repobench-p,52.92,Qwen1.5-14B-Chat,PartialLogQuant_2_256
samsum,32.2,Qwen1.5-14B-Chat,PartialLogQuant_2_256
trec,78.5,Qwen1.5-14B-Chat,PartialLogQuant_2_256
triviaqa,89.14,Qwen1.5-14B-Chat,PartialLogQuant_2_256
vcsum,19.42,Qwen1.5-14B-Chat,PartialLogQuant_2_256
