,Method,coqa_no_context,coqa_no_context,gsm8k_cot,gsm8k_cot,mmlu,mmlu,trivia,trivia,wmt14_fren,wmt14_fren,wmt19_deen,wmt19_deen,xsum,xsum,mean,mean
,,score,rank,score,rank,score,rank,score,rank,score,rank,score,rank,score,rank,score,rank
0,IMBA_5_Exp_FeatureWise,0.3539072688626817,28,0.4195943513518368,10,0.48435118748515354,9,0.5971003226095873,35,0.4756605149260609,2,0.6124082889697553,2,0.40542211261547556,8,0.4783491495457931,1
1,IMBA_5_Beta_FeatureWise,0.3559311755679011,27,0.4094022435676103,15,0.48149729155804055,11,0.5992797863161664,30,0.4756884120135038,1,0.613108735819395,1,0.40961240144557487,5,0.4777885780411703,2
2,Master_1_Exp_FeatureWise,0.3568331206384237,23,0.4384188895505521,1,0.4612692485546353,28,0.6059897111371616,19,0.4705490644370739,4,0.5651288492363911,19,0.40839199219393746,6,0.4723686965354536,3
3,Master_1_Beta_FeatureWise,0.35757552940177656,22,0.43052234550484547,4,0.4605135548140211,30,0.6065659339959799,18,0.4705899537311239,3,0.5648647878548656,20,0.410730843691164,2,0.4716232784276824,4
4,Master_1_Exp_Global,0.36831171163567006,18,0.3665045012273101,25,0.4637113658607377,24,0.6082722822165677,15,0.4596903351995628,5,0.5953842121662374,5,0.40027482440881673,13,0.46602131895927185,5
5,Master_1_Beta_Global,0.3689158432322261,16,0.36580775299934604,26,0.4632584532307667,25,0.6080937337743142,16,0.4587753887894021,6,0.5952347107729354,6,0.4006452471715034,11,0.4658187328529277,6
6,GreedySemanticEnrichedMaxprobAveDissimilarity,0.36688944781471106,19,0.3623250674051183,28,0.4915081450689612,3,0.6026024708144654,25,0.44258893191215026,9,0.5840277304265048,9,0.39489736192661967,14,0.46354845076693296,7
7,IMBA_2_Beta_Global,0.3761082343971038,8,0.3680051312837121,23,0.4618374417385124,27,0.6142896699840256,14,0.44099727514479303,11,0.5778446097666027,12,0.40055892385246866,12,0.46280589802388833,8
8,IMBA_2_Exp_Global,0.3770278390470965,7,0.3710167074070598,22,0.46111784484389207,29,0.6164034320583637,10,0.4384094774934149,15,0.5737790414342681,15,0.4014578433340675,9,0.4627445979454518,9
9,IMBA_4_Exp_FeatureWise,0.37945779046944095,5,0.43030151287612145,5,0.47818455076083183,14,0.6191689165355333,8,0.3443281074871054,39,0.5639557116944628,21,0.4104751135126702,3,0.4608388147623094,10
10,CoCoA_like_3_Beta_FeatureWise,0.3361449572100301,43,0.40982001894029085,14,0.4752661557854556,18,0.5948590005343471,36,0.43906793462296406,13,0.5768049740975582,13,0.3882842113730661,16,0.46003532179481604,11
11,IMBA_4_Beta_FeatureWise,0.3799412009134995,4,0.4198053854907241,9,0.4763329826450927,17,0.6194842467025079,7,0.33543212050351034,43,0.5598555464668976,23,0.4147854517292002,1,0.45794813349306185,12
12,CoCoA_like_3_Exp_FeatureWise,0.3399538133349229,42,0.4194868082002068,11,0.4788516694484677,13,0.59132486144735,40,0.44154050680364276,10,0.5761317384257775,14,0.33589836283820634,26,0.45474110864265344,13
13,GreedySemanticEnrichedPPLAveDissimilarity,0.35162899838388906,31,0.4171212700234634,12,0.4576403065274914,36,0.5978727519708046,31,0.4399087443027737,12,0.5089921598735679,40,0.40119992453069664,10,0.4534805936589552,14
14,IMBA_2_Exp_FeatureWise,0.3828520159956502,2,0.43533017649454975,2,0.4559283089953639,39,0.625140220331994,2,0.319404794721741,46,0.5181738420382864,33,0.40674199553378076,7,0.4490816220159095,15
15,IMBA_2_Beta_FeatureWise,0.3806074009502634,3,0.42864734816345734,6,0.45760625675816213,37,0.6236770780956231,6,0.3182931263216277,47,0.5232908711331715,32,0.41009936058867963,4,0.4488887774301407,16
16,GreedySemanticEnrichedMTEAveDissimilarity,0.35051138133315163,33,0.43338099590598866,3,0.4084731351151693,49,0.6038526278859513,24,0.4359246907001319,16,0.5051741627062631,42,0.3920473831494081,15,0.44705205382800906,17
17,Master_3_Beta_FeatureWise,0.3563855164901218,25,0.4119945402721775,13,0.45574208155883783,40,0.6019851666870014,26,0.45075880216351616,8,0.5825377201409542,10,0.2556005811897298,28,0.44500062978604843,18
18,Master_3_Exp_FeatureWise,0.35641486425590896,24,0.4084914286851481,16,0.4560570239996547,38,0.6009838527482936,27,0.4509691356204639,7,0.5807661557125713,11,0.24767212634718042,30,0.44305065533846016,19
19,CoCoA_like_1_Beta_FeatureWise,0.34019915404465023,40,0.3953006465212775,17,0.4721620736739356,20,0.5925790353306328,38,0.43846568842025463,14,0.6111431873644263,3,0.21046376450891394,34,0.4371876499805844,20
20,CoCoA_like_1_Exp_FeatureWise,0.3401824781114157,41,0.39439405906054137,18,0.47659681622513766,16,0.5915005223884485,39,0.43398255446548234,17,0.6029755143729432,4,0.20210905193160084,37,0.4345344280793671,21
21,IMBA_4_Exp_Global,0.3507881701357217,32,0.338916997765958,33,0.48921871779950676,5,0.6000922093326921,28,0.35435921870196324,34,0.524928284284068,31,0.3740949135714406,18,0.4331997873701929,22
22,Master_3_Exp_Global,0.36293528942607356,21,0.35414274605949236,29,0.45907528470038045,34,0.6049647540216267,22,0.4318897773414381,18,0.5942524749450727,7,0.217941624376803,32,0.4321717072672695,23
23,IMBA_4_Beta_Global,0.34807208256446354,34,0.3324097401788327,35,0.4879137676123754,7,0.597837880295155,32,0.34968924087893216,36,0.5151886766563227,37,0.3731971799593897,20,0.42918693830649596,24
24,Master_3_Beta_Global,0.3644339622560227,20,0.3512082955862157,30,0.4590890818936043,33,0.6055626690684881,21,0.4234179859147912,19,0.591117015248646,8,0.2076205899513949,36,0.42892137141702324,25
25,IMBA_5_Exp_Global,0.34313783453762314,38,0.3333717527573117,34,0.4928822756962684,2,0.5894221479201078,43,0.35070773943995853,35,0.5156441040857078,36,0.3736446863683263,19,0.42840150582932907,26
26,IMBA_5_Beta_Global,0.34180464273590777,39,0.33186792237570945,36,0.4914498201400395,4,0.5890691414941723,44,0.34759013868468625,37,0.5105693888574265,39,0.37306200086655733,21,0.42648757930778564,27
27,IMBA_3_Beta_FeatureWise,0.3760738417540506,9,0.4198931662729999,8,0.4536957919423146,42,0.6237151999063811,4,0.31612401793051303,48,0.5176499820477768,34,0.2617187920424076,27,0.42412439884234915,28
28,IMBA_3_Exp_FeatureWise,0.3779128976142238,6,0.42684860006717645,7,0.45214249898517295,44,0.6236974618669752,5,0.31568877079079094,49,0.5110324436940554,38,0.2552003220747977,29,0.42321757072759897,29
29,IMBA_3_Beta_Global,0.37522331646499457,11,0.3507887509275844,31,0.4537538528050185,41,0.6265660492763326,1,0.3811894391884348,27,0.5583644373939286,25,0.2094082487448638,35,0.4221848706858796,30
30,IMBA_3_Exp_Global,0.37329673090076537,13,0.36337827755117774,27,0.4534000043622256,43,0.6247167468323476,3,0.36094424254893726,31,0.5410794110753225,29,0.19968558265755182,38,0.4166429994183325,31
31,CoCoA_like_3_Exp_Global,0.3147146571322594,50,0.31712338673389945,40,0.48868607104373424,6,0.5726457363620613,49,0.3442008196345364,40,0.5165048243599953,35,0.35225953271186994,23,0.41516214685405084,32
32,CoCoA_like_3_Beta_Global,0.3150340552801161,49,0.314538158244811,41,0.48622181023392974,8,0.5701570962096525,50,0.3382637513865656,42,0.5059495477132322,41,0.35200890182999145,24,0.4117390458426141,33
33,CoCoA_like_1_Exp_Global,0.3213016332404753,47,0.326568742894334,37,0.48083231998471415,12,0.5838404420803717,45,0.34392591195425426,41,0.5403154141145828,30,0.22688893968643256,31,0.4033819148507378,34
34,MaximumSequenceProbability,0.2903383764571443,53,0.30990965019320343,42,0.5163742458085981,1,0.5383458026248632,54,0.3202805286566051,45,0.46891341054963714,45,0.3414654095556287,25,0.39794677483509716,35
35,CoCoA_like_1_Beta_Global,0.31717228284742294,48,0.30760206828661646,46,0.4831449722739105,10,0.574003246396224,48,0.32152694124418846,44,0.49415530874616626,43,0.21055072760657628,33,0.3868793639144435,36
36,Master_2_Beta_FeatureWise,0.34618826418099635,37,0.3096464249520601,43,0.44384766987872215,48,0.5907449117360453,41,0.4157694385086533,21,0.5675804485318818,17,0.017415781856668155,51,0.38445613423500385,37
37,Master_2_Exp_FeatureWise,0.3468677657215289,35,0.30818373505585045,45,0.4443684337378429,47,0.5903859543527732,42,0.41686528550840496,20,0.5652006347564031,18,0.017065593100981023,52,0.3841339146048264,38
38,IMBA_1_Exp_Global,0.37033857542106535,14,0.27423213136140595,54,0.467714435281856,23,0.6075249721340303,17,0.37416673131677386,30,0.5500676526121044,28,0.023388485132608914,48,0.38106185475140647,39
39,IMBA_1_Beta_Global,0.3687358445375736,17,0.2719914909932367,55,0.46823943776699467,22,0.605629829146301,20,0.37463716483963794,29,0.5516906916842947,27,0.023985869833427112,47,0.38070147554306655,40
40,Perplexity,0.26097396688929236,55,0.2838139598526605,50,0.4689465460454115,21,0.5197899906919223,55,0.34556911542546687,38,0.4023862968981658,53,0.3828069216159804,17,0.3806123996312714,41
41,Master_2_Exp_Global,0.3535729386807588,29,0.278936010099658,52,0.44946054694447024,45,0.5972581340755363,33,0.3889701787186136,25,0.5589423437377595,24,0.021147415511043807,50,0.37832679539540576,42
42,Master_2_Beta_Global,0.3532385880954817,30,0.27559177088842085,53,0.44918457942671597,46,0.5971742978839111,34,0.38671548745776047,26,0.5581750570997084,26,0.022315052093238256,49,0.3774849761350339,43
43,CoCoA_like_2_Beta_FeatureWise,0.33082439596791446,45,0.2978916751623792,48,0.45911202295119186,32,0.5812835564327669,46,0.390238094776669,24,0.5702465192523958,16,0.011943928647936888,57,0.3773628847416077,44
44,CoCoA_like_2_Exp_FeatureWise,0.33325624428161676,44,0.2799022525144401,51,0.46225516904355496,26,0.5778406544626961,47,0.39113172644565597,23,0.5626861086878694,22,0.012643653496712932,56,0.37424511556179235,45
45,SAR_t0.001,0.32390929085961334,46,0.38903963227020205,19,0.36010371337255964,52,0.5927166807295662,37,0.4121480830449252,22,0.47217989444561254,44,0.05677836173617836,42,0.37241080806552246,46
46,GreedyAveDissimilarity,0.3910022318903868,1,0.36688207117304955,24,0.39513521698957593,50,0.6151586471429527,12,0.37640946759787525,28,0.4503690313569445,48,0.007431241968953817,58,0.3717697011599626,47
47,IMBA_1_Beta_FeatureWise,0.37469576133587146,12,0.3244896263329105,38,0.46018121999991574,31,0.6148014703717338,13,0.2870364897435066,53,0.46123767503981056,46,0.04054568564007815,43,0.36614113263768955,48
48,IMBA_1_Exp_FeatureWise,0.37602955704275276,10,0.32251708546202024,39,0.4577547229167371,35,0.6164600080713202,9,0.28818120904920347,52,0.45810302562250804,47,0.03823426619941381,44,0.36532569633770795,49
49,MeanTokenEntropy,0.24758979168902925,57,0.30842945787917403,44,0.362241203464571,51,0.5058596809486801,56,0.35761329552371274,33,0.3905437960780045,55,0.36724969262769086,22,0.3627895597444089,50
50,CEDegMat,0.3560516331510232,26,0.2983684947263705,47,0.3357519071879287,54,0.6040702536198393,23,0.3111047863747844,50,0.3957786621267919,54,0.06796191408751055,41,0.3384410930391784,51
51,CoCoA_like_2_Exp_Global,0.3027236999572841,52,0.23511532088517864,57,0.4772295974111069,15,0.5623594355347038,51,0.2898020024716065,51,0.4446124968091121,49,0.012701725980811646,55,0.3320777541499719,52
52,CoCoA_like_2_Beta_Global,0.30514767052559805,51,0.22775217049767058,58,0.4747053014186195,19,0.5622247449503776,52,0.2838046327505986,54,0.43524917514560346,50,0.013703001265410575,54,0.32894095665055406,53
53,DegMat_NLI_score_entail,0.369725241029249,15,0.29444832533964466,49,0.3460102868908559,53,0.6159335499960796,11,0.22023565289439534,57,0.3565933206584537,57,0.0755618620238374,39,0.32550117697607367,54
54,SemanticEntropy,0.2890910545198381,54,0.3837266001104885,20,0.23486422319543582,56,0.5407779478539805,53,0.2771823149842847,55,0.4100902971874611,51,0.028615076016741472,45,0.30919250198117576,55
55,MonteCarloNormalizedSequenceEntropy,0.23588400507875787,58,0.3491421464597288,32,0.17101045917379804,58,0.4991360365107927,57,0.3601099644624739,32,0.40689415683048946,52,0.015923900292109036,53,0.29115723840116425,56
56,EigValLaplacian_NLI_score_entail,0.34639530034437827,36,0.2635021980935415,56,0.29554554949669715,55,0.5998074464893319,29,0.15240984285987416,58,0.2833388010446303,58,0.07519106127714023,40,0.2880271713722276,57
57,MonteCarloSequenceEntropy,0.24987767388293983,56,0.37357120242230085,21,0.17378886420914436,57,0.4740192090551184,58,0.2741017480754361,56,0.3839915577174478,56,0.02779974142978589,46,0.2795928566845962,58
