task,score,model,method
2wikimqa,32.8,Qwen1.5-7B-Chat,baseline
dureader,25.96,Qwen1.5-7B-Chat,baseline
gov_report,16.66,Qwen1.5-7B-Chat,baseline
hotpotqa,48.11,Qwen1.5-7B-Chat,baseline
lcc,58.17,Qwen1.5-7B-Chat,baseline
lsht,28,Qwen1.5-7B-Chat,baseline
multifieldqa_en,47.14,Qwen1.5-7B-Chat,baseline
multifieldqa_zh,53.4,Qwen1.5-7B-Chat,baseline
multi_news,15.02,Qwen1.5-7B-Chat,baseline
musique,26.74,Qwen1.5-7B-Chat,baseline
narrativeqa,20.06,Qwen1.5-7B-Chat,baseline
passage_count,1,Qwen1.5-7B-Chat,baseline
passage_retrieval_en,40.5,Qwen1.5-7B-Chat,baseline
passage_retrieval_zh,59,Qwen1.5-7B-Chat,baseline
qasper,39.84,Qwen1.5-7B-Chat,baseline
qmsum,18.25,Qwen1.5-7B-Chat,baseline
repobench-p,45.46,Qwen1.5-7B-Chat,baseline
samsum,33.01,Qwen1.5-7B-Chat,baseline
trec,70.5,Qwen1.5-7B-Chat,baseline
triviaqa,86.76,Qwen1.5-7B-Chat,baseline
vcsum,17.98,Qwen1.5-7B-Chat,baseline
2wikimqa,31.83,Qwen1.5-7B-Chat,KiVi_2_128
dureader,22.64,Qwen1.5-7B-Chat,KiVi_2_128
gov_report,15.57,Qwen1.5-7B-Chat,KiVi_2_128
hotpotqa,47.37,Qwen1.5-7B-Chat,KiVi_2_128
lcc,45.87,Qwen1.5-7B-Chat,KiVi_2_128
lsht,24,Qwen1.5-7B-Chat,KiVi_2_128
multifieldqa_en,42.26,Qwen1.5-7B-Chat,KiVi_2_128
multifieldqa_zh,50.18,Qwen1.5-7B-Chat,KiVi_2_128
multi_news,15,Qwen1.5-7B-Chat,KiVi_2_128
musique,25.88,Qwen1.5-7B-Chat,KiVi_2_128
narrativeqa,19.02,Qwen1.5-7B-Chat,KiVi_2_128
passage_count,0.5,Qwen1.5-7B-Chat,KiVi_2_128
passage_retrieval_en,20,Qwen1.5-7B-Chat,KiVi_2_128
passage_retrieval_zh,18.25,Qwen1.5-7B-Chat,KiVi_2_128
qasper,37.19,Qwen1.5-7B-Chat,KiVi_2_128
qmsum,17.59,Qwen1.5-7B-Chat,KiVi_2_128
repobench-p,26.33,Qwen1.5-7B-Chat,KiVi_2_128
samsum,29.7,Qwen1.5-7B-Chat,KiVi_2_128
trec,69.5,Qwen1.5-7B-Chat,KiVi_2_128
triviaqa,86.51,Qwen1.5-7B-Chat,KiVi_2_128
vcsum,19.15,Qwen1.5-7B-Chat,KiVi_2_128
2wikimqa,31.83,Qwen1.5-7B-Chat,KiVi_2_192
dureader,22.64,Qwen1.5-7B-Chat,KiVi_2_192
gov_report,15.53,Qwen1.5-7B-Chat,KiVi_2_192
hotpotqa,47.37,Qwen1.5-7B-Chat,KiVi_2_192
lcc,45.87,Qwen1.5-7B-Chat,KiVi_2_192
lsht,24,Qwen1.5-7B-Chat,KiVi_2_192
multifieldqa_en,42.26,Qwen1.5-7B-Chat,KiVi_2_192
multifieldqa_zh,50.18,Qwen1.5-7B-Chat,KiVi_2_192
multi_news,15.01,Qwen1.5-7B-Chat,KiVi_2_192
musique,25.88,Qwen1.5-7B-Chat,KiVi_2_192
narrativeqa,19.02,Qwen1.5-7B-Chat,KiVi_2_192
passage_count,0.5,Qwen1.5-7B-Chat,KiVi_2_192
passage_retrieval_en,20,Qwen1.5-7B-Chat,KiVi_2_192
passage_retrieval_zh,18.25,Qwen1.5-7B-Chat,KiVi_2_192
qasper,37.19,Qwen1.5-7B-Chat,KiVi_2_192
qmsum,17.53,Qwen1.5-7B-Chat,KiVi_2_192
repobench-p,26.33,Qwen1.5-7B-Chat,KiVi_2_192
samsum,29.7,Qwen1.5-7B-Chat,KiVi_2_192
trec,69.5,Qwen1.5-7B-Chat,KiVi_2_192
triviaqa,86.51,Qwen1.5-7B-Chat,KiVi_2_192
vcsum,19.05,Qwen1.5-7B-Chat,KiVi_2_192
2wikimqa,31.83,Qwen1.5-7B-Chat,KiVi_2_256
dureader,22.64,Qwen1.5-7B-Chat,KiVi_2_256
gov_report,15.55,Qwen1.5-7B-Chat,KiVi_2_256
hotpotqa,47.37,Qwen1.5-7B-Chat,KiVi_2_256
lcc,45.87,Qwen1.5-7B-Chat,KiVi_2_256
lsht,24,Qwen1.5-7B-Chat,KiVi_2_256
multifieldqa_en,42.26,Qwen1.5-7B-Chat,KiVi_2_256
multifieldqa_zh,50.18,Qwen1.5-7B-Chat,KiVi_2_256
multi_news,15.01,Qwen1.5-7B-Chat,KiVi_2_256
musique,25.88,Qwen1.5-7B-Chat,KiVi_2_256
narrativeqa,19.02,Qwen1.5-7B-Chat,KiVi_2_256
passage_count,0.5,Qwen1.5-7B-Chat,KiVi_2_256
passage_retrieval_en,20,Qwen1.5-7B-Chat,KiVi_2_256
passage_retrieval_zh,18.25,Qwen1.5-7B-Chat,KiVi_2_256
qasper,37.19,Qwen1.5-7B-Chat,KiVi_2_256
qmsum,17.53,Qwen1.5-7B-Chat,KiVi_2_256
repobench-p,26.33,Qwen1.5-7B-Chat,KiVi_2_256
samsum,29.7,Qwen1.5-7B-Chat,KiVi_2_256
trec,69.5,Qwen1.5-7B-Chat,KiVi_2_256
triviaqa,86.51,Qwen1.5-7B-Chat,KiVi_2_256
vcsum,19.05,Qwen1.5-7B-Chat,KiVi_2_256
2wikimqa,32.14,Qwen1.5-7B-Chat,LogQuant_2_128
dureader,24.06,Qwen1.5-7B-Chat,LogQuant_2_128
gov_report,15.84,Qwen1.5-7B-Chat,LogQuant_2_128
hotpotqa,48.91,Qwen1.5-7B-Chat,LogQuant_2_128
lcc,53.77,Qwen1.5-7B-Chat,LogQuant_2_128
lsht,24.5,Qwen1.5-7B-Chat,LogQuant_2_128
multifieldqa_en,43.72,Qwen1.5-7B-Chat,LogQuant_2_128
multifieldqa_zh,51.68,Qwen1.5-7B-Chat,LogQuant_2_128
multi_news,14.92,Qwen1.5-7B-Chat,LogQuant_2_128
musique,27.09,Qwen1.5-7B-Chat,LogQuant_2_128
narrativeqa,20.06,Qwen1.5-7B-Chat,LogQuant_2_128
passage_count,0,Qwen1.5-7B-Chat,LogQuant_2_128
passage_retrieval_en,24,Qwen1.5-7B-Chat,LogQuant_2_128
passage_retrieval_zh,29,Qwen1.5-7B-Chat,LogQuant_2_128
qasper,37.28,Qwen1.5-7B-Chat,LogQuant_2_128
qmsum,18.18,Qwen1.5-7B-Chat,LogQuant_2_128
repobench-p,30.76,Qwen1.5-7B-Chat,LogQuant_2_128
samsum,33.31,Qwen1.5-7B-Chat,LogQuant_2_128
trec,67.5,Qwen1.5-7B-Chat,LogQuant_2_128
triviaqa,87.37,Qwen1.5-7B-Chat,LogQuant_2_128
vcsum,19.34,Qwen1.5-7B-Chat,LogQuant_2_128
2wikimqa,32.21,Qwen1.5-7B-Chat,LogQuant_2_192
dureader,23.71,Qwen1.5-7B-Chat,LogQuant_2_192
gov_report,16.04,Qwen1.5-7B-Chat,LogQuant_2_192
hotpotqa,48.71,Qwen1.5-7B-Chat,LogQuant_2_192
lcc,54.69,Qwen1.5-7B-Chat,LogQuant_2_192
lsht,24.5,Qwen1.5-7B-Chat,LogQuant_2_192
multifieldqa_en,43.94,Qwen1.5-7B-Chat,LogQuant_2_192
multifieldqa_zh,51.23,Qwen1.5-7B-Chat,LogQuant_2_192
multi_news,14.73,Qwen1.5-7B-Chat,LogQuant_2_192
musique,26,Qwen1.5-7B-Chat,LogQuant_2_192
narrativeqa,20.49,Qwen1.5-7B-Chat,LogQuant_2_192
passage_count,0.5,Qwen1.5-7B-Chat,LogQuant_2_192
passage_retrieval_en,24,Qwen1.5-7B-Chat,LogQuant_2_192
passage_retrieval_zh,28,Qwen1.5-7B-Chat,LogQuant_2_192
qasper,37.22,Qwen1.5-7B-Chat,LogQuant_2_192
qmsum,18.11,Qwen1.5-7B-Chat,LogQuant_2_192
repobench-p,31.94,Qwen1.5-7B-Chat,LogQuant_2_192
samsum,33.4,Qwen1.5-7B-Chat,LogQuant_2_192
trec,68,Qwen1.5-7B-Chat,LogQuant_2_192
triviaqa,87.24,Qwen1.5-7B-Chat,LogQuant_2_192
vcsum,19.32,Qwen1.5-7B-Chat,LogQuant_2_192
2wikimqa,32.44,Qwen1.5-7B-Chat,LogQuant_2_256
dureader,23.39,Qwen1.5-7B-Chat,LogQuant_2_256
gov_report,16.02,Qwen1.5-7B-Chat,LogQuant_2_256
hotpotqa,48.97,Qwen1.5-7B-Chat,LogQuant_2_256
lcc,53.66,Qwen1.5-7B-Chat,LogQuant_2_256
lsht,25.5,Qwen1.5-7B-Chat,LogQuant_2_256
multifieldqa_en,44.11,Qwen1.5-7B-Chat,LogQuant_2_256
multifieldqa_zh,51.59,Qwen1.5-7B-Chat,LogQuant_2_256
multi_news,14.86,Qwen1.5-7B-Chat,LogQuant_2_256
musique,26.37,Qwen1.5-7B-Chat,LogQuant_2_256
narrativeqa,20.37,Qwen1.5-7B-Chat,LogQuant_2_256
passage_count,0.5,Qwen1.5-7B-Chat,LogQuant_2_256
passage_retrieval_en,25,Qwen1.5-7B-Chat,LogQuant_2_256
passage_retrieval_zh,26,Qwen1.5-7B-Chat,LogQuant_2_256
qasper,36.67,Qwen1.5-7B-Chat,LogQuant_2_256
qmsum,17.77,Qwen1.5-7B-Chat,LogQuant_2_256
repobench-p,31.96,Qwen1.5-7B-Chat,LogQuant_2_256
samsum,33.1,Qwen1.5-7B-Chat,LogQuant_2_256
trec,68,Qwen1.5-7B-Chat,LogQuant_2_256
triviaqa,87.32,Qwen1.5-7B-Chat,LogQuant_2_256
vcsum,19.31,Qwen1.5-7B-Chat,LogQuant_2_256
2wikimqa,32.53,Qwen1.5-7B-Chat,PartialLogQuant_2_128
dureader,23.72,Qwen1.5-7B-Chat,PartialLogQuant_2_128
gov_report,15.83,Qwen1.5-7B-Chat,PartialLogQuant_2_128
hotpotqa,48.11,Qwen1.5-7B-Chat,PartialLogQuant_2_128
lcc,53.93,Qwen1.5-7B-Chat,PartialLogQuant_2_128
lsht,25,Qwen1.5-7B-Chat,PartialLogQuant_2_128
multifieldqa_en,44.08,Qwen1.5-7B-Chat,PartialLogQuant_2_128
multifieldqa_zh,51.13,Qwen1.5-7B-Chat,PartialLogQuant_2_128
multi_news,14.83,Qwen1.5-7B-Chat,PartialLogQuant_2_128
musique,26.33,Qwen1.5-7B-Chat,PartialLogQuant_2_128
narrativeqa,20.5,Qwen1.5-7B-Chat,PartialLogQuant_2_128
passage_count,0.5,Qwen1.5-7B-Chat,PartialLogQuant_2_128
passage_retrieval_en,24.5,Qwen1.5-7B-Chat,PartialLogQuant_2_128
passage_retrieval_zh,27.5,Qwen1.5-7B-Chat,PartialLogQuant_2_128
qasper,37.13,Qwen1.5-7B-Chat,PartialLogQuant_2_128
qmsum,17.82,Qwen1.5-7B-Chat,PartialLogQuant_2_128
repobench-p,32.55,Qwen1.5-7B-Chat,PartialLogQuant_2_128
samsum,32.62,Qwen1.5-7B-Chat,PartialLogQuant_2_128
trec,67,Qwen1.5-7B-Chat,PartialLogQuant_2_128
triviaqa,87.79,Qwen1.5-7B-Chat,PartialLogQuant_2_128
vcsum,19.26,Qwen1.5-7B-Chat,PartialLogQuant_2_128
2wikimqa,32.32,Qwen1.5-7B-Chat,PartialLogQuant_2_192
dureader,23.61,Qwen1.5-7B-Chat,PartialLogQuant_2_192
gov_report,15.71,Qwen1.5-7B-Chat,PartialLogQuant_2_192
hotpotqa,48.01,Qwen1.5-7B-Chat,PartialLogQuant_2_192
lcc,54.51,Qwen1.5-7B-Chat,PartialLogQuant_2_192
lsht,25.5,Qwen1.5-7B-Chat,PartialLogQuant_2_192
multifieldqa_en,43.95,Qwen1.5-7B-Chat,PartialLogQuant_2_192
multifieldqa_zh,51.49,Qwen1.5-7B-Chat,PartialLogQuant_2_192
multi_news,15,Qwen1.5-7B-Chat,PartialLogQuant_2_192
musique,26.23,Qwen1.5-7B-Chat,PartialLogQuant_2_192
narrativeqa,19.92,Qwen1.5-7B-Chat,PartialLogQuant_2_192
passage_count,0.5,Qwen1.5-7B-Chat,PartialLogQuant_2_192
passage_retrieval_en,24.5,Qwen1.5-7B-Chat,PartialLogQuant_2_192
passage_retrieval_zh,28,Qwen1.5-7B-Chat,PartialLogQuant_2_192
qasper,37.55,Qwen1.5-7B-Chat,PartialLogQuant_2_192
qmsum,17.98,Qwen1.5-7B-Chat,PartialLogQuant_2_192
repobench-p,33.14,Qwen1.5-7B-Chat,PartialLogQuant_2_192
samsum,32.98,Qwen1.5-7B-Chat,PartialLogQuant_2_192
trec,67,Qwen1.5-7B-Chat,PartialLogQuant_2_192
triviaqa,86.68,Qwen1.5-7B-Chat,PartialLogQuant_2_192
vcsum,19.16,Qwen1.5-7B-Chat,PartialLogQuant_2_192
2wikimqa,32.18,Qwen1.5-7B-Chat,PartialLogQuant_2_256
dureader,23.69,Qwen1.5-7B-Chat,PartialLogQuant_2_256
gov_report,15.71,Qwen1.5-7B-Chat,PartialLogQuant_2_256
hotpotqa,48.29,Qwen1.5-7B-Chat,PartialLogQuant_2_256
lcc,54.5,Qwen1.5-7B-Chat,PartialLogQuant_2_256
lsht,25.5,Qwen1.5-7B-Chat,PartialLogQuant_2_256
multifieldqa_en,43.84,Qwen1.5-7B-Chat,PartialLogQuant_2_256
multifieldqa_zh,51.41,Qwen1.5-7B-Chat,PartialLogQuant_2_256
multi_news,14.86,Qwen1.5-7B-Chat,PartialLogQuant_2_256
musique,26.25,Qwen1.5-7B-Chat,PartialLogQuant_2_256
narrativeqa,20.16,Qwen1.5-7B-Chat,PartialLogQuant_2_256
passage_count,0.5,Qwen1.5-7B-Chat,PartialLogQuant_2_256
passage_retrieval_en,22.5,Qwen1.5-7B-Chat,PartialLogQuant_2_256
passage_retrieval_zh,28,Qwen1.5-7B-Chat,PartialLogQuant_2_256
qasper,37.18,Qwen1.5-7B-Chat,PartialLogQuant_2_256
qmsum,17.92,Qwen1.5-7B-Chat,PartialLogQuant_2_256
repobench-p,33.96,Qwen1.5-7B-Chat,PartialLogQuant_2_256
samsum,33.01,Qwen1.5-7B-Chat,PartialLogQuant_2_256
trec,67,Qwen1.5-7B-Chat,PartialLogQuant_2_256
triviaqa,86.57,Qwen1.5-7B-Chat,PartialLogQuant_2_256
vcsum,19.17,Qwen1.5-7B-Chat,PartialLogQuant_2_256
