,Method,coqa_no_context,coqa_no_context,gsm8k_cot,gsm8k_cot,mmlu,mmlu,trivia,trivia,wmt14_fren,wmt14_fren,wmt19_deen,wmt19_deen,xsum,xsum,mean,mean
,,score,rank,score,rank,score,rank,score,rank,score,rank,score,rank,score,rank,score,rank
0,IMBA_5_Exp_FeatureWise,0.39283672279129545,17,0.5767685872115362,1,0.47296211160298196,17,0.6781396394341549,17,0.4453764061088857,3,0.6403584633980794,2,0.3370481075940242,12,0.5062128625915654,1
1,IMBA_5_Beta_FeatureWise,0.39519610061766314,10,0.5684176644282453,2,0.4723246569696879,18,0.6796751428891746,13,0.4408386425195589,6,0.6425201167899152,1,0.33932598754360727,7,0.5054711873939789,2
2,Master_1_Exp_FeatureWise,0.39209059850861666,19,0.5674035021914363,4,0.46441956541765744,27,0.6801691294732267,8,0.42856160762855294,8,0.6090277074463012,10,0.3423335688221066,6,0.49771509706969974,3
3,Master_1_Beta_FeatureWise,0.3931888023643788,15,0.5634081006863322,6,0.46498615915972746,25,0.6805812183947622,7,0.4292799403785568,7,0.6086780719400008,12,0.343823708314941,5,0.4977065716055285,4
4,Master_1_Exp_Global,0.40133642392595364,6,0.5524476672925981,9,0.46414831224598774,28,0.6825695022274773,1,0.41454740938455825,11,0.6217339428352229,3,0.33844587109596797,9,0.49646130414396655,5
5,Master_1_Beta_Global,0.4020822106236568,5,0.5514067508087196,10,0.4645562172457944,26,0.6823359059852352,2,0.4135623196802083,12,0.6211949045648469,4,0.33770393977232815,10,0.49612032124011274,6
6,IMBA_4_Exp_FeatureWise,0.39604230955982167,9,0.5678710822032282,3,0.4655689735207098,24,0.6808315761388981,6,0.3909500189242942,22,0.6022584942606438,15,0.3475208173208495,3,0.49300618170406363,7
7,IMBA_2_Beta_Global,0.40329432628942186,1,0.5556727780998519,8,0.459898288391955,39,0.6822154579710399,3,0.4006949586879574,14,0.6116514029002197,7,0.33724519981152695,11,0.49295320173599616,8
8,IMBA_2_Exp_Global,0.4025348427849672,4,0.5579080171486416,7,0.45780808883822294,44,0.6817725889800217,4,0.3989706330969435,15,0.6089829031985495,11,0.3390140099480497,8,0.49242729771362803,9
9,IMBA_4_Beta_FeatureWise,0.39683058462430226,8,0.5673219588195068,5,0.46693876177293087,23,0.6811719111801194,5,0.3775429363337399,26,0.603750676606058,14,0.34995082201004185,1,0.4919296644780999,10
10,GreedySemanticEnrichedMaxprobAveDissimilarity,0.4026118060075888,3,0.5479594018152636,11,0.46945722442402316,21,0.6769917496705079,22,0.40212659607812945,13,0.6070222050369081,13,0.33097951180379354,13,0.4910212135480307,11
11,CoCoA_like_3_Beta_FeatureWise,0.3676260543796421,40,0.5091018739470905,19,0.4744088371132423,9,0.6766090808246334,24,0.46398671737251795,2,0.6143086888570308,6,0.31055259254750783,19,0.4880848350059521,12
12,CoCoA_like_3_Exp_FeatureWise,0.37051757834661886,39,0.526321133102412,15,0.4742901711365285,11,0.6742887297260238,29,0.4674269997981928,1,0.6103800072140027,9,0.258001644455203,24,0.48303232339699737,13
13,IMBA_2_Beta_FeatureWise,0.39477481786287166,12,0.5449739438988831,12,0.4588029773419293,43,0.6800554356348143,10,0.35073964010058506,42,0.5749232127417385,20,0.3498639738501386,2,0.4791620002044229,14
14,IMBA_2_Exp_FeatureWise,0.39227619409530584,18,0.5441100665985089,13,0.4552022706030315,48,0.6795013171743759,14,0.35514229175987966,41,0.5648320662732901,25,0.34697587247544653,4,0.47686286842569114,15
15,IMBA_4_Exp_Global,0.3935064580225977,13,0.5307000841585708,14,0.46996291541750207,20,0.6780431177288594,19,0.36469991370425925,32,0.5374317189360487,33,0.31296775377304037,14,0.4696159945344112,16
16,GreedySemanticEnrichedPPLAveDissimilarity,0.38906525833334776,26,0.45877782453260857,34,0.46945722442402316,21,0.6780871706628614,18,0.3963190531944536,18,0.5705221875902282,23,0.3092075877825462,20,0.4673480437885812,17
17,GreedySemanticEnrichedMTEAveDissimilarity,0.3760770116760862,34,0.4895062660899169,24,0.4487557661300187,50,0.6763070996107192,26,0.3966109425422158,17,0.5645517338717979,26,0.3121309195835008,15,0.46627710564346503,18
18,IMBA_4_Beta_Global,0.391973942056012,20,0.5216701542246996,17,0.4701474242242301,19,0.6765611597095789,25,0.3609029142140052,38,0.5302132307531373,37,0.31165272177893383,17,0.46616022099437104,19
19,IMBA_5_Exp_Global,0.3890162180915173,27,0.5226124675497983,16,0.4742150761191853,13,0.6723378923211881,34,0.36225390414630565,36,0.5288872314424785,38,0.31203429560123713,16,0.4659081550388158,20
20,Master_3_Beta_FeatureWise,0.3882129899842291,28,0.4856060168941707,25,0.4641012339993781,29,0.6779216527085654,20,0.4173318260713256,9,0.6012265786460804,16,0.22317366226448704,28,0.4653677086526051,21
21,CoCoA_like_1_Beta_FeatureWise,0.3732594672794196,36,0.47962761874404897,29,0.4743294047259695,10,0.6754757403424647,27,0.44308389803708187,4,0.6200450974999634,5,0.1903530643484991,33,0.46516775585392095,22
22,IMBA_5_Beta_Global,0.389129657527245,25,0.5211488668991531,18,0.47369324411588565,15,0.671273521260005,37,0.3592154723056992,39,0.5256157494602641,39,0.311199519675439,18,0.46446800446338443,23
23,Master_3_Exp_FeatureWise,0.3877336664199576,29,0.47872892004572015,31,0.4636590924159138,32,0.6773027847356099,21,0.4163100593322527,10,0.6000616681112977,17,0.2172128796444104,29,0.4630012958150232,24
24,CoCoA_like_1_Exp_FeatureWise,0.37369749297888605,35,0.47106184073397345,32,0.4751939055658202,5,0.6744004865275909,28,0.4423897007296651,5,0.6104942576486749,8,0.15855487913635583,38,0.45797036618870945,25
25,Master_3_Exp_Global,0.3949508882311248,11,0.4542006628661518,35,0.46395881852371906,31,0.6799745122179354,12,0.3915318444466938,21,0.5910620126268025,18,0.19577218030889867,31,0.45306441703161804,26
26,CoCoA_like_3_Exp_Global,0.3573244536694625,44,0.49824997695967527,20,0.47557600904480096,3,0.6701426556495169,40,0.3635577845152398,34,0.5161038330390634,42,0.2867247923510393,21,0.45252564360411396,27
27,CoCoA_like_3_Beta_Global,0.36195056600710124,42,0.4948661078246094,22,0.475190823918471,6,0.6689275910391633,42,0.3551652529978038,40,0.5081016359698677,43,0.28498190752745567,22,0.44988341218349603,28
28,Master_3_Beta_Global,0.39799705583906375,7,0.44399937224261954,37,0.4640036093403834,30,0.6800357679774521,11,0.38587882548378555,25,0.5816981798548625,19,0.1813582023216081,36,0.44785300186568217,29
29,IMBA_3_Beta_FeatureWise,0.3906986164993023,22,0.4845585509062311,26,0.4593490889842298,41,0.6791973059425176,15,0.3323837815009234,47,0.5449537053409176,32,0.23674132276722867,25,0.4468403388487644,30
30,IMBA_3_Exp_FeatureWise,0.38981419289101926,23,0.4795319070551158,30,0.4563318617735527,45,0.6787061203151492,16,0.3335387139397081,46,0.5361159812601392,36,0.22409097510032555,27,0.4425899646192871,31
31,IMBA_3_Exp_Global,0.38964607362164916,24,0.4541208739668431,36,0.45538376263049074,47,0.680068462437014,9,0.349687846761275,43,0.5463473678351519,30,0.18398381950370804,34,0.4370340295365903,32
32,IMBA_3_Beta_Global,0.39105669259288217,21,0.4328255035635728,38,0.45436953926778756,49,0.676784515504967,23,0.36097916771363536,37,0.5595881150229068,28,0.18306800148717595,35,0.43695307645041825,33
33,MaximumSequenceProbability,0.34977722673381795,50,0.4905525706236685,23,0.4784266255654024,1,0.6335729723469893,53,0.3319082264822418,48,0.4728609125194713,47,0.2779090540697339,23,0.43357251262018925,34
34,CoCoA_like_1_Exp_Global,0.3581798592031525,43,0.39630153210136115,42,0.4754219084442899,4,0.6718132311740053,35,0.36574373264243215,31,0.5229640484957688,40,0.19447687216494866,32,0.4264144548894226,35
35,Master_2_Beta_FeatureWise,0.37257965969283147,37,0.3874584284945546,45,0.4630150266178112,34,0.6705598874277487,39,0.3935572122759398,20,0.5725705311928232,21,0.06397334128528223,45,0.41767344099814163,36
36,Master_2_Exp_FeatureWise,0.3713597695269969,38,0.3870303187604042,46,0.46229901066147855,37,0.6699189267580926,41,0.3944354915777308,19,0.5723304155234343,22,0.06352788669324849,46,0.41727168850019797,37
37,CoCoA_like_2_Beta_FeatureWise,0.3563272535622567,45,0.39361069162939377,43,0.47340812687948197,16,0.6681440953618687,43,0.38874505677920557,23,0.5703437986717298,24,0.04997092591547309,48,0.4143642783999157,38
38,CoCoA_like_2_Exp_FeatureWise,0.3544133161159357,47,0.39648861672235086,41,0.47382916599400937,14,0.6669604992678975,45,0.38771772931802395,24,0.5614088790045673,27,0.04534005032344431,49,0.4123083223923184,39
39,CoCoA_like_1_Beta_Global,0.3624375594899686,41,0.3691892627186965,48,0.47480771264579824,8,0.6673795517188611,44,0.3364254881035563,45,0.47039882633264235,48,0.17673853182657662,37,0.4081967046908713,40
40,SAR_t0.001,0.3322779071267751,52,0.48349775712891,27,0.41832765318875986,52,0.6377071422617052,51,0.37154251017184614,29,0.519274497549691,41,0.0888869353617661,42,0.4073592003984934,41
41,GreedyAveDissimilarity,0.4028663501474562,2,0.46471984213028966,33,0.42654204276296226,51,0.6521258000318666,48,0.3055292557029677,50,0.49947111655523635,44,0.06347794528520662,47,0.4021046218022836,42
42,Perplexity,0.2888826579883211,55,0.27995450428689517,55,0.4784266255654024,1,0.6361344298081747,52,0.3699330168336485,30,0.48377642119232067,45,0.2259527405155309,26,0.39472291374147045,43
43,Master_2_Exp_Global,0.383406345246175,32,0.2865614639378643,51,0.4625829733559396,36,0.6732350382521577,31,0.37389959733999806,27,0.5468749677693304,29,0.029204958009097996,50,0.3936807634157947,44
44,Master_2_Beta_Global,0.3848309536827403,30,0.28293650803471343,52,0.46302528739210047,33,0.6731833584389915,32,0.3722421239087919,28,0.5451968299579772,31,0.02718347423075367,51,0.3926569336637241,45
45,MeanTokenEntropy,0.251966845197086,58,0.3255302706376313,50,0.4591048180710494,42,0.6230201416173752,54,0.3969208733117502,16,0.4770982876233739,46,0.20323395215169357,30,0.39098216980142275,46
46,IMBA_1_Beta_Global,0.3930611163707224,16,0.2807161866347911,54,0.46259370069674854,35,0.673419151665272,30,0.3633453298270568,35,0.537287261950729,35,0.022947721834178765,53,0.39048149556849976,47
47,IMBA_1_Exp_Global,0.3933760657492765,14,0.2822502969301961,53,0.4596818145976444,40,0.6726992978556086,33,0.3637071557618427,33,0.5373839979331287,34,0.02368913937355492,52,0.39039825260017885,48
48,IMBA_1_Beta_FeatureWise,0.38443815113072205,31,0.3993730986708466,40,0.4609583738553157,38,0.6718042419423025,36,0.2862414482317674,54,0.4529953478996618,50,0.07050812185690424,44,0.38947411194107434,49
49,IMBA_1_Exp_FeatureWise,0.38336121672800666,33,0.38040044798172157,47,0.45622881597793374,46,0.6712636695272813,38,0.28973405533397767,52,0.4466152342530626,52,0.07289342497568996,43,0.38578526639681054,50
50,CEDegMat,0.3437535125908797,51,0.391923490797378,44,0.40290242753798783,54,0.6414144226636476,50,0.28687405801263594,53,0.4513508201646404,51,0.12259399144618104,41,0.37725896045905005,51
51,DegMat_NLI_score_entail,0.35181287057542293,48,0.32728879607551054,49,0.4100131555615904,53,0.6511365432425319,49,0.22368675466070773,57,0.3849678136204714,56,0.13000045856093514,39,0.35412948461388144,52
52,CoCoA_like_2_Exp_Global,0.3499799895580218,49,0.22481206624239425,57,0.47493986623369217,7,0.655231612840818,47,0.3073158131664309,49,0.41014925620207826,53,-0.00916118305793277,57,0.3447524887407861,53
53,SemanticEntropy,0.2937160369686372,54,0.4829880718466227,28,0.3871396606395704,56,0.5646499030281426,56,0.27354559678512735,55,0.40856020042438407,54,-0.0071341862904719415,55,0.3433521833431446,54
54,CoCoA_like_2_Beta_Global,0.35582607691614626,46,0.22188046734146613,58,0.4742244603339501,12,0.6556184536923192,46,0.30212108189841713,51,0.4030993618802545,55,-0.00940698608649641,58,0.34333755942515104,55
55,MonteCarloNormalizedSequenceEntropy,0.26119878527319484,57,0.4102680399860182,39,0.36053234232002224,57,0.5339639795940192,57,0.343332490912385,44,0.4660846326708116,49,0.006537174670138541,54,0.34027392077522706,56
56,EigValLaplacian_NLI_score_entail,0.3157093887956531,53,0.26435930269818747,56,0.4012606027205103,55,0.6215662100493088,55,0.2007932943477858,58,0.33049427729543424,58,0.12615690777894864,40,0.3229057119551183,57
57,MonteCarloSequenceEntropy,0.26766420059766316,56,0.49549113159903013,21,0.3415133181292738,58,0.4975402664908539,58,0.26352591496122285,56,0.36999598915755977,57,-0.0075796678961627464,56,0.318307307577063,58
