,Method,coqa_no_context,coqa_no_context,gsm8k_cot,gsm8k_cot,mmlu,mmlu,trivia,trivia,wmt14_fren,wmt14_fren,wmt19_deen,wmt19_deen,xsum,xsum,mean,mean
,,score,rank,score,rank,score,rank,score,rank,score,rank,score,rank,score,rank,score,rank
0,IMBA_5_Beta_FeatureWise,0.4227292542725085,18,0.5060453783092244,8,0.5425206515889752,19,0.6981752887608367,18,0.4863456047010888,4,0.6151934497240802,1,0.20987201602831196,13,0.49726880619786085,1
1,IMBA_5_Exp_FeatureWise,0.4188793034900926,22,0.5139404568358557,2,0.5426443580659641,18,0.6976593614267387,19,0.4840595132372574,5,0.6111168328940231,2,0.20780305585554376,16,0.49658612597221075,2
2,Master_1_Exp_FeatureWise,0.4250578967345293,7,0.510720056676844,6,0.5351996286164645,35,0.6946450311660988,21,0.4614144876555846,11,0.5994059990009706,6,0.21454127770453502,11,0.4915691967935753,3
3,Master_1_Beta_FeatureWise,0.4259245695163561,6,0.5070771771154637,7,0.5354697197574454,31,0.6951766817983902,20,0.4611728380246709,12,0.600237147818279,4,0.21498766455213533,10,0.49143511408324864,4
4,IMBA_4_Beta_FeatureWise,0.4232621071683183,16,0.5122159859564503,3,0.5352992706922544,34,0.7045776358452491,1,0.44848125372949216,17,0.5947400679157375,13,0.2195307756408203,8,0.49115815670690316,5
5,IMBA_4_Exp_FeatureWise,0.42353531216689033,13,0.5160134071500391,1,0.5326830829678492,37,0.7044755469561303,2,0.4519724998687274,15,0.5906524500991046,15,0.21648635809594152,9,0.4908312367578117,6
6,CoCoA_like_3_Beta_FeatureWise,0.41003907514220944,37,0.47717173522391043,10,0.5450732670681239,7,0.694086477896991,22,0.49351664865844647,2,0.5987754159540968,8,0.18101367914343325,25,0.4856680427267444,7
7,IMBA_2_Beta_FeatureWise,0.4294247487205681,4,0.51203830491464,4,0.5266622029440289,43,0.7025588157005669,4,0.4171768374105482,29,0.574448551010397,22,0.2257389678974515,2,0.4840069183711715,8
8,CoCoA_like_3_Exp_FeatureWise,0.41583339819513343,33,0.4743167126057099,11,0.5434627272234863,16,0.691980816967883,23,0.4823039949472457,6,0.5976248379497658,9,0.1795847191591232,26,0.48358674386404965,9
9,Master_1_Beta_Global,0.4237197222995125,10,0.44154787876825213,16,0.5360488736184654,25,0.7003489127713889,10,0.45588775263144116,14,0.599279336180481,7,0.22276392611566997,5,0.48279948605503015,10
10,Master_1_Exp_Global,0.42347315453864637,14,0.4420205120717252,15,0.5357326324049798,28,0.6993545571623405,13,0.45639292111137714,13,0.5998766141818351,5,0.22260570147905417,6,0.4827794418499941,11
11,IMBA_2_Exp_FeatureWise,0.4295669992040764,3,0.5113472170611145,5,0.5235049597794207,46,0.7041448004751182,3,0.4142315607176036,30,0.5641994340466646,28,0.22587741606699388,1,0.48183891247871313,12
12,IMBA_2_Beta_Global,0.4233552095661106,15,0.44867104174830325,14,0.527890061547221,39,0.7016759657550078,6,0.4398571563537062,24,0.5971188903383701,11,0.22296234044682356,4,0.48021866653650613,13
13,IMBA_2_Exp_Global,0.423755574894083,9,0.4543567223263276,13,0.525527477925083,45,0.7011395576162279,7,0.4341899963223103,25,0.5973671995196653,10,0.22317475676772733,3,0.47993018362448925,14
14,GreedySemanticEnrichedMTEAveDissimilarity,0.41602788344554137,32,0.5049126755119575,9,0.5278296257044175,40,0.6887830849351071,28,0.4426854165562632,22,0.568280180677606,26,0.20792048457531956,15,0.4794913359151732,15
15,GreedySemanticEnrichedMaxprobAveDissimilarity,0.41002341772499107,38,0.43839452790024663,17,0.5391108023839714,21,0.6987305919150877,16,0.44425626842945215,19,0.5896451946968848,17,0.22206174144551277,7,0.4774603634994495,16
16,GreedySemanticEnrichedPPLAveDissimilarity,0.4211806624824883,20,0.4713186996505482,12,0.5391108023839714,21,0.6826709172748028,35,0.4415499295030166,23,0.5731547767695135,23,0.20908043650107366,14,0.47686660350934496,17
17,CoCoA_like_1_Beta_FeatureWise,0.41853366038340395,24,0.39644547028754806,29,0.545107565041574,6,0.6856135301424001,30,0.49676584745224184,1,0.604912391462563,3,0.15035471796442426,36,0.4711047403905936,18
18,Master_3_Beta_FeatureWise,0.42451538003977723,8,0.40510776305407536,27,0.5354533138269568,32,0.6838365451309522,33,0.46438352107952346,9,0.5925145437269176,14,0.17743522531062783,29,0.4690351845955472,19
19,CoCoA_like_1_Exp_FeatureWise,0.418873757428743,23,0.3812163349811897,36,0.5443469018197764,14,0.6868637774698806,29,0.4902927573788786,3,0.595547803531815,12,0.14660539424883967,41,0.4662495324084462,20
20,Master_3_Exp_FeatureWise,0.42286036967285895,17,0.38694250218672277,33,0.5350180892306398,36,0.6827643573345696,34,0.4641285163704912,10,0.5903602595397651,16,0.1747039992317568,34,0.46525401336668637,21
21,IMBA_3_Beta_FeatureWise,0.42958642595257196,2,0.4362952849596217,18,0.5270931009472776,41,0.6991075463174784,14,0.39504817159310524,36,0.5563584572724707,30,0.2125677070265012,12,0.4651509562955753,22
22,Master_3_Beta_Global,0.4235717331297152,12,0.39207466368758875,32,0.5359438834720271,26,0.6916608328708224,25,0.4456365790286477,18,0.5784981824951984,20,0.1771542244929466,30,0.4635057284538494,23
23,IMBA_3_Exp_FeatureWise,0.4298835778953543,1,0.42881419211334526,20,0.5220885860714576,48,0.7004627899096109,8,0.3945384984064161,37,0.5476271176119109,35,0.20690370289485466,17,0.46147406641470706,24
24,Master_3_Exp_Global,0.42369342262900045,11,0.3651695062667044,40,0.5355307615748703,30,0.6895446163431547,27,0.4518482238273221,16,0.583482282620789,19,0.1754760543662778,32,0.46067783823258834,25
25,IMBA_3_Beta_Global,0.42194055279792547,19,0.3953781046774884,30,0.5165237090530408,51,0.7024903688384337,5,0.40743772621306834,33,0.5661297256139244,27,0.1930132938794473,23,0.45755906872476115,26
26,IMBA_3_Exp_Global,0.4278963282585654,5,0.37053105085848104,39,0.5194554812763086,50,0.6998250177777446,12,0.39324915460621174,39,0.5596615351968417,29,0.19112839335114357,24,0.45167813733218526,27
27,IMBA_4_Exp_Global,0.401660098598813,40,0.4214228916762283,21,0.537459872076076,23,0.700390949222019,9,0.38096539343035773,40,0.5056433440218775,38,0.19983208597905297,19,0.4496249478577749,28
28,IMBA_5_Exp_Global,0.3999374897777233,43,0.4107701780139347,24,0.5446493222496886,13,0.6987326682481834,15,0.3721774012902418,43,0.4938567262004455,43,0.19974607722145346,20,0.44569569471452436,29
29,IMBA_4_Beta_Global,0.4001762625653103,42,0.41270210592197026,23,0.5395662519064957,20,0.7002198956135145,11,0.37057811345963815,44,0.49602959060667695,42,0.199253348986581,21,0.44550365272288384,30
30,IMBA_5_Beta_Global,0.39832292025440513,45,0.40992051697553405,25,0.5448289407340535,12,0.6984872952888823,17,0.3652258530613763,45,0.4875154975062964,45,0.1990235147034516,22,0.4433320769319999,31
31,CoCoA_like_3_Exp_Global,0.3959784028426125,46,0.3976935698832882,28,0.5449315917400732,11,0.691268703985201,26,0.3724611020881105,42,0.4741180043213442,47,0.1778038527067342,28,0.43632217536676626,32
32,CoCoA_like_1_Exp_Global,0.4070390888620179,39,0.35998160469586843,41,0.5450576657965049,8,0.683957435437365,32,0.4038613660122441,34,0.5010751484353445,40,0.14959083512823335,37,0.4357947349096541,33
33,CoCoA_like_3_Beta_Global,0.39484177572046425,47,0.39381756477638147,31,0.5458089202279901,3,0.6918350232324602,24,0.36232113456230325,46,0.4639457160715802,48,0.17833690500852392,27,0.43298671994281474,34
34,GreedyAveDissimilarity,0.4170210997686245,29,0.40654795838600366,26,0.4931399447061957,53,0.6573179502333482,50,0.33231296596581744,51,0.48745650889747155,46,0.20261294673084285,18,0.42805848209832914,35
35,MeanTokenEntropy,0.30486078845476083,56,0.3837720240651879,35,0.543345465926065,17,0.6417926003353303,55,0.42591115406136737,26,0.5317768455418268,36,0.1391610406325325,49,0.42437427414529577,36
36,SAR_t0.001,0.39198522541662023,49,0.3732687652121127,38,0.5201258225509877,49,0.6472068800544056,54,0.3965545979747628,35,0.5030700352333431,39,0.13649209808964696,51,0.42410048921883986,37
37,CoCoA_like_2_Beta_FeatureWise,0.4115263258674258,36,0.1813920925077567,55,0.5449761380085185,10,0.6604960471897744,45,0.47136350199249155,7,0.5851454060265376,18,0.0907181224997205,55,0.4208025191560322,38
38,Master_2_Beta_Global,0.41915502881309075,21,0.19412995458306415,51,0.5361115387331691,24,0.6722411317990544,41,0.4195208911318341,28,0.5521249481244084,32,0.14578754283356427,43,0.4198672908597407,39
39,IMBA_1_Beta_Global,0.41765794366589665,26,0.20404198866512183,50,0.5286422088337523,38,0.6789790687059769,39,0.4115819213369599,31,0.5490741970054557,34,0.14807538352279456,39,0.41972181596227964,40
40,Master_2_Exp_Global,0.41830374293481865,25,0.19347262600178833,52,0.5358566923974161,27,0.6706388716984907,42,0.42104075642604466,27,0.5533486682565661,31,0.1430166554682864,47,0.41938257331191586,41
41,IMBA_1_Exp_Global,0.41700335087813867,30,0.20462622906440756,49,0.5255515456674785,44,0.6787849366330557,40,0.41082959087280996,32,0.5493174908053177,33,0.14775754623845666,40,0.41912438430852356,42
42,Master_2_Beta_FeatureWise,0.417212215426775,28,0.18858036606017164,53,0.5355940422723278,29,0.6595799531801521,46,0.4437698423294608,20,0.5726846359237017,24,0.1127684439101948,53,0.41859849987182624,43
43,Master_2_Exp_FeatureWise,0.4175651775636147,27,0.1879996161891519,54,0.5353161307955765,33,0.6587702334929706,49,0.44298418589687677,21,0.5710808823476775,25,0.11311009286421618,52,0.41811804559286914,44
44,Perplexity,0.3226074196357253,54,0.3430158975017434,44,0.5481107973886685,1,0.6532759152376933,52,0.393926460134514,38,0.5202563368452758,37,0.14438289318394035,46,0.41793938856108015,45
45,CoCoA_like_1_Beta_Global,0.39856961611213043,44,0.35013920573643637,42,0.5456589202276771,5,0.6854778973374763,31,0.35978452514211506,47,0.43731880763522774,51,0.1453714559816997,44,0.4174743468818233,46
46,CoCoA_like_2_Exp_FeatureWise,0.41614273205324187,31,0.1682957109236824,56,0.5437537420089731,15,0.6593171623803534,47,0.4674973359135236,8,0.574466259337844,21,0.08154468721856278,58,0.4158596614051688,47
47,MaximumSequenceProbability,0.3377322321966553,53,0.3860287036271553,34,0.5481107973886685,1,0.6798093485258837,37,0.327803167534366,53,0.41971647345617896,53,0.17678740604550283,31,0.41085544696777293,48
48,IMBA_1_Beta_FeatureWise,0.41454586884848155,35,0.27880023624693734,46,0.5270549724803392,42,0.6792051422632623,38,0.3343211579098993,50,0.4977604995072072,41,0.14203174751999215,48,0.410531374968017,49
49,IMBA_1_Exp_FeatureWise,0.41559603361797975,34,0.2724399335318461,47,0.5231267428693708,47,0.6800261712460123,36,0.33839078325712957,48,0.490179920035626,44,0.13833397140855108,50,0.40829907942378796,50
50,DegMat_NLI_score_entail,0.40087537187393224,41,0.37935366605536136,37,0.4939401906944078,52,0.6625894738660205,43,0.2906251630308511,57,0.43991046319690735,50,0.17417895767120634,35,0.40592475519838384,51
51,CEDegMat,0.39367469304256797,48,0.30309600709031415,45,0.48961412453923386,54,0.6494151598679337,53,0.3097722235363272,55,0.43675152647234083,52,0.1463206809999023,42,0.38980634507837436,52
52,SemanticEntropy,0.3063766663701464,55,0.4204882419270109,22,0.4739140823084939,55,0.5928527116307865,56,0.3233813196710645,54,0.4112275852703827,54,0.14941304946560313,38,0.3825219509490697,53
53,EigValLaplacian_NLI_score_entail,0.3793858871537972,52,0.3482003965575014,43,0.47121281188532466,56,0.6556135117612405,51,0.2411032985281203,58,0.4002087048912466,55,0.17476525055100012,33,0.3814985516183187,54
54,CoCoA_like_2_Exp_Global,0.387730606336458,51,0.15248767079645906,57,0.5450179819308092,9,0.6589877390546026,48,0.33725814580595526,49,0.3959007077431483,56,0.0863289646743901,56,0.36624454519168886,55
55,MonteCarloNormalizedSequenceEntropy,0.30292387887925953,57,0.2704936721364699,48,0.4504534537415151,57,0.5832591559070677,57,0.3809086118443938,41,0.46079063505654394,49,0.10661297706579483,54,0.3650631978044349,56
56,CoCoA_like_2_Beta_Global,0.38816814798285254,50,0.14275051657195686,58,0.5456615429620445,4,0.6619845546054574,44,0.3284242373150087,52,0.38792055794665703,57,0.08393099035743876,57,0.36269150682020224,57
57,MonteCarloSequenceEntropy,0.26674317986384005,58,0.4292497754635891,19,0.42618022078787515,58,0.5620075542864129,58,0.30406907651978793,56,0.35775023061351613,58,0.14487155612945224,45,0.3558387990949248,58
