db_id,dataset_name,seed,lens_unnormalized,lens,test_acc_mean
app_store,qwen2.5-coder-7b_zero-shot_bg_test-time-info_v1,42,0.4768392857142858,0.4276739440373637,25.4
app_store,llama3.1-8b_zero-shot_bg_v1,42,0.4807678571428572,0.4734801650960354,22.22
app_store,qwen2.5-coder-7b_few-shot_bg_test-time-info_v1,42,0.4720559523809525,0.4343070837502916,34.92
app_store,qwen2.5-coder-7b_few-shot_bg_v1,42,0.4719178571428572,0.458108926409846,31.75
app_store,qwen2.5-coder-7b_zero-shot_bg_v1,42,0.4575476190476191,0.4566680730129214,22.22
app_store,llama3.1-8b_few-shot_bg_v1,42,0.4886678571428571,0.4635468204589635,39.68
app_store,llama3.1-8b_zero-shot_bg_test-time-info_v1,42,0.4844392857142857,0.4694923355400928,20.63
app_store,llama3.1-8b_few-shot_bg_test-time-info_v1,42,0.4922619047619047,0.4654517343864739,46.03
movie_platform,qwen2.5-coder-7b_zero-shot_bg_test-time-info_v1,42,0.4889857142857143,0.4292700931506734,20.36
movie_platform,llama3.1-8b_zero-shot_bg_v1,42,0.4756178571428572,0.4574030038170614,37.72
movie_platform,qwen2.5-coder-7b_few-shot_bg_test-time-info_v1,42,0.4926428571428571,0.4470187609415534,43.71
movie_platform,qwen2.5-coder-7b_few-shot_bg_v1,42,0.4833,0.4365583811920673,46.11
movie_platform,qwen2.5-coder-7b_zero-shot_bg_v1,42,0.4875523809523809,0.3938212689709563,16.77
movie_platform,llama3.1-8b_few-shot_bg_v1,42,0.4955011904761904,0.4989285157108833,44.31
movie_platform,llama3.1-8b_zero-shot_bg_test-time-info_v1,42,0.4944464285714285,0.4838441587033756,38.32
movie_platform,llama3.1-8b_few-shot_bg_test-time-info_v1,42,0.4923166666666667,0.4600925814842014,50.9
computer_student,qwen2.5-coder-7b_zero-shot_bg_test-time-info_v1,42,0.4816940476190476,0.4545465605521983,48.61
computer_student,llama3.1-8b_zero-shot_bg_v1,42,0.4818369047619047,0.4672734773090576,36.11
computer_student,qwen2.5-coder-7b_few-shot_bg_test-time-info_v1,42,0.4803928571428572,0.4673523366218796,48.61
computer_student,qwen2.5-coder-7b_few-shot_bg_v1,42,0.4805059523809524,0.4644139303206779,45.83
computer_student,qwen2.5-coder-7b_zero-shot_bg_v1,42,0.4860238095238095,0.4585945348141584,50.0
computer_student,llama3.1-8b_few-shot_bg_v1,42,0.4682678571428571,0.4596796260724873,50.0
computer_student,llama3.1-8b_zero-shot_bg_test-time-info_v1,42,0.4790857142857143,0.4601217290999851,40.28
computer_student,llama3.1-8b_few-shot_bg_test-time-info_v1,42,0.4610357142857142,0.4553190431697198,47.22
app_store,qwen2.5-coder-7b_zero-shot_bg_test-time-info_v1,43,0.4781607142857143,0.4247077529819926,25.4
app_store,llama3.1-8b_zero-shot_bg_v1,43,0.486,0.4228592068845124,22.22
app_store,qwen2.5-coder-7b_few-shot_bg_test-time-info_v1,43,0.4887880952380952,0.450944938888174,34.92
app_store,qwen2.5-coder-7b_few-shot_bg_v1,43,0.4806630952380952,0.425919618720345,31.75
app_store,qwen2.5-coder-7b_zero-shot_bg_v1,43,0.4748392857142858,0.3685001484734231,22.22
app_store,llama3.1-8b_few-shot_bg_v1,43,0.4889964285714285,0.4560181873198539,39.68
app_store,llama3.1-8b_zero-shot_bg_test-time-info_v1,43,0.4821392857142857,0.4386203606880335,20.63
app_store,llama3.1-8b_few-shot_bg_test-time-info_v1,43,0.493075,0.475439173015541,46.03
movie_platform,qwen2.5-coder-7b_zero-shot_bg_test-time-info_v1,43,0.4939095238095238,0.4860419994264512,20.36
movie_platform,llama3.1-8b_zero-shot_bg_v1,43,0.4851464285714286,0.4712863611852626,37.72
movie_platform,qwen2.5-coder-7b_few-shot_bg_test-time-info_v1,43,0.4813285714285715,0.4750395961205421,43.71
movie_platform,qwen2.5-coder-7b_few-shot_bg_v1,43,0.4974059523809523,0.4843080255382384,46.11
movie_platform,qwen2.5-coder-7b_zero-shot_bg_v1,43,0.4775857142857143,0.4585946256915928,16.77
movie_platform,llama3.1-8b_few-shot_bg_v1,43,0.4972535714285714,0.4924540199578583,44.31
movie_platform,llama3.1-8b_zero-shot_bg_test-time-info_v1,43,0.4852,0.470226843122479,38.32
movie_platform,llama3.1-8b_few-shot_bg_test-time-info_v1,43,0.4982678571428571,0.4859849929908899,50.9
computer_student,qwen2.5-coder-7b_zero-shot_bg_test-time-info_v1,43,0.4927285714285714,0.4390042562589399,48.61
computer_student,llama3.1-8b_zero-shot_bg_v1,43,0.464275,0.4488045094327877,36.11
computer_student,qwen2.5-coder-7b_few-shot_bg_test-time-info_v1,43,0.4879285714285714,0.4839153153470817,48.61
computer_student,qwen2.5-coder-7b_few-shot_bg_v1,43,0.5027892857142857,0.4843177855297926,45.83
computer_student,qwen2.5-coder-7b_zero-shot_bg_v1,43,0.4857416666666667,0.4856333067539638,50.0
computer_student,llama3.1-8b_few-shot_bg_v1,43,0.4743416666666666,0.4663067671262278,50.0
computer_student,llama3.1-8b_zero-shot_bg_test-time-info_v1,43,0.4807142857142857,0.4578066924029217,40.28
computer_student,llama3.1-8b_few-shot_bg_test-time-info_v1,43,0.4856714285714286,0.4798996584061242,47.22
app_store,qwen2.5-coder-7b_zero-shot_bg_test-time-info_v1,44,0.4814642857142858,0.4060686888796422,25.4
app_store,llama3.1-8b_zero-shot_bg_v1,44,0.4960321428571428,0.3724218822929895,22.22
app_store,qwen2.5-coder-7b_few-shot_bg_test-time-info_v1,44,0.4837511904761905,0.408767009877069,34.92
app_store,qwen2.5-coder-7b_few-shot_bg_v1,44,0.488575,0.3766571021238259,31.75
app_store,qwen2.5-coder-7b_zero-shot_bg_v1,44,0.4735571428571429,0.4545317866218818,22.22
app_store,llama3.1-8b_few-shot_bg_v1,44,0.4782869047619048,0.4307770029159695,39.68
app_store,llama3.1-8b_zero-shot_bg_test-time-info_v1,44,0.4795178571428572,0.3811025639870642,20.63
app_store,llama3.1-8b_few-shot_bg_test-time-info_v1,44,0.4950380952380953,0.3906144075024794,46.03
movie_platform,qwen2.5-coder-7b_zero-shot_bg_test-time-info_v1,44,0.4875928571428571,0.4620098786060479,20.36
movie_platform,llama3.1-8b_zero-shot_bg_v1,44,0.4815285714285715,0.4739052695313369,37.72
movie_platform,qwen2.5-coder-7b_few-shot_bg_test-time-info_v1,44,0.4894107142857143,0.4580031691456802,43.71
movie_platform,qwen2.5-coder-7b_few-shot_bg_v1,44,0.4855452380952381,0.4786086386723088,46.11
movie_platform,qwen2.5-coder-7b_zero-shot_bg_v1,44,0.4824785714285715,0.4525342061303557,16.77
movie_platform,llama3.1-8b_few-shot_bg_v1,44,0.4953,0.4793009748876956,44.31
movie_platform,llama3.1-8b_zero-shot_bg_test-time-info_v1,44,0.481975,0.4863762171677349,38.32
movie_platform,llama3.1-8b_few-shot_bg_test-time-info_v1,44,0.4957678571428571,0.4880605672404271,50.9
computer_student,qwen2.5-coder-7b_zero-shot_bg_test-time-info_v1,44,0.4907452380952382,0.4720592127460833,48.61
computer_student,llama3.1-8b_zero-shot_bg_v1,44,0.4830071428571428,0.4726030651444888,36.11
computer_student,qwen2.5-coder-7b_few-shot_bg_test-time-info_v1,44,0.4193404761904762,0.3960993334326818,48.61
computer_student,qwen2.5-coder-7b_few-shot_bg_v1,44,0.466,0.4257500698608665,45.83
computer_student,qwen2.5-coder-7b_zero-shot_bg_v1,44,0.4733333333333333,0.4692188690533674,50.0
computer_student,llama3.1-8b_few-shot_bg_v1,44,0.4677107142857143,0.4580137075792728,50.0
computer_student,llama3.1-8b_zero-shot_bg_test-time-info_v1,44,0.5027857142857143,0.4114514372622423,40.28
computer_student,llama3.1-8b_few-shot_bg_test-time-info_v1,44,0.4826178571428571,0.4842806977377261,47.22
app_store,qwen2.5-coder-7b_zero-shot_bg_test-time-info_v1,45,0.4815892857142858,0.4754664562952959,25.4
app_store,llama3.1-8b_zero-shot_bg_v1,45,0.4706857142857143,0.460434239052828,22.22
app_store,qwen2.5-coder-7b_few-shot_bg_test-time-info_v1,45,0.4897321428571429,0.4585224898534237,34.92
app_store,qwen2.5-coder-7b_few-shot_bg_v1,45,0.4768535714285714,0.4135018131634722,31.75
app_store,qwen2.5-coder-7b_zero-shot_bg_v1,45,0.4601071428571429,0.4253380069819414,22.22
app_store,llama3.1-8b_few-shot_bg_v1,45,0.4954107142857143,0.4853481058559765,39.68
app_store,llama3.1-8b_zero-shot_bg_test-time-info_v1,45,0.4822785714285714,0.3136399620657448,20.63
app_store,llama3.1-8b_few-shot_bg_test-time-info_v1,45,0.4827714285714286,0.470484890225457,46.03
movie_platform,qwen2.5-coder-7b_zero-shot_bg_test-time-info_v1,45,0.4944952380952381,0.4748763682440353,20.36
movie_platform,llama3.1-8b_zero-shot_bg_v1,45,0.4808809523809524,0.4912262988594486,37.72
movie_platform,qwen2.5-coder-7b_few-shot_bg_test-time-info_v1,45,0.4890714285714286,0.4805531341877059,43.71
movie_platform,qwen2.5-coder-7b_few-shot_bg_v1,45,0.4806321428571428,0.460190939943108,46.11
movie_platform,qwen2.5-coder-7b_zero-shot_bg_v1,45,0.4810857142857143,0.4131181475202942,16.77
movie_platform,llama3.1-8b_few-shot_bg_v1,45,0.4956214285714285,0.4942767410512537,44.31
movie_platform,llama3.1-8b_zero-shot_bg_test-time-info_v1,45,0.4985928571428571,0.4551401373288135,38.32
movie_platform,llama3.1-8b_few-shot_bg_test-time-info_v1,45,0.4889285714285714,0.4909099922896247,50.9
computer_student,qwen2.5-coder-7b_zero-shot_bg_test-time-info_v1,45,0.4863857142857143,0.479704925341647,48.61
computer_student,llama3.1-8b_zero-shot_bg_v1,45,0.480495238095238,0.46722479298815,36.11
computer_student,qwen2.5-coder-7b_few-shot_bg_test-time-info_v1,45,0.436175,0.4108100454234106,48.61
computer_student,qwen2.5-coder-7b_few-shot_bg_v1,45,0.4925107142857143,0.4785171660750904,45.83
computer_student,qwen2.5-coder-7b_zero-shot_bg_v1,45,0.489447619047619,0.483579467084879,50.0
computer_student,llama3.1-8b_few-shot_bg_v1,45,0.4726833333333333,0.4561494719935513,50.0
computer_student,llama3.1-8b_zero-shot_bg_test-time-info_v1,45,0.4620821428571428,0.4329693500371727,40.28
computer_student,llama3.1-8b_few-shot_bg_test-time-info_v1,45,0.48225,0.4687669803012647,47.22
app_store,qwen2.5-coder-7b_zero-shot_bg_test-time-info_v1,46,0.4505428571428572,0.4068236307724066,25.4
app_store,llama3.1-8b_zero-shot_bg_v1,46,0.4811321428571429,0.4637282295333979,22.22
app_store,qwen2.5-coder-7b_few-shot_bg_test-time-info_v1,46,0.487025,0.4534408259325427,34.92
app_store,qwen2.5-coder-7b_few-shot_bg_v1,46,0.4711071428571429,0.4393921299951059,31.75
app_store,qwen2.5-coder-7b_zero-shot_bg_v1,46,0.4907380952380953,0.4240918299368212,22.22
app_store,llama3.1-8b_few-shot_bg_v1,46,0.5003511904761905,0.4423920361422404,39.68
app_store,llama3.1-8b_zero-shot_bg_test-time-info_v1,46,0.4846035714285714,0.4045212917985201,20.63
app_store,llama3.1-8b_few-shot_bg_test-time-info_v1,46,0.4817500000000001,0.4578235785011156,46.03
movie_platform,qwen2.5-coder-7b_zero-shot_bg_test-time-info_v1,46,0.4907738095238095,0.4400929110956872,20.36
movie_platform,llama3.1-8b_zero-shot_bg_v1,46,0.4632714285714286,0.465933507376791,37.72
movie_platform,qwen2.5-coder-7b_few-shot_bg_test-time-info_v1,46,0.4817321428571429,0.4761654819932623,43.71
movie_platform,qwen2.5-coder-7b_few-shot_bg_v1,46,0.4915357142857143,0.4056268083053204,46.11
movie_platform,qwen2.5-coder-7b_zero-shot_bg_v1,46,0.4859892857142857,0.4790776092287716,16.77
movie_platform,llama3.1-8b_few-shot_bg_v1,46,0.4911285714285714,0.480069457488839,44.31
movie_platform,llama3.1-8b_zero-shot_bg_test-time-info_v1,46,0.4816714285714286,0.4868801301206509,38.32
movie_platform,llama3.1-8b_few-shot_bg_test-time-info_v1,46,0.4898178571428572,0.4676658374199161,50.9
computer_student,qwen2.5-coder-7b_zero-shot_bg_test-time-info_v1,46,0.4863785714285714,0.4713913902322418,48.61
computer_student,llama3.1-8b_zero-shot_bg_v1,46,0.4738714285714285,0.4662444704215748,36.11
computer_student,qwen2.5-coder-7b_few-shot_bg_test-time-info_v1,46,0.4675785714285714,0.4677134487237159,48.61
computer_student,qwen2.5-coder-7b_few-shot_bg_v1,46,0.4795904761904762,0.4302974463634229,45.83
computer_student,qwen2.5-coder-7b_zero-shot_bg_v1,46,0.4863630952380953,0.4838103116235562,50.0
computer_student,llama3.1-8b_few-shot_bg_v1,46,0.4906464285714286,0.4857493164912063,50.0
computer_student,llama3.1-8b_zero-shot_bg_test-time-info_v1,46,0.4712357142857143,0.4242131082831618,40.28
computer_student,llama3.1-8b_few-shot_bg_test-time-info_v1,46,0.4823583333333333,0.4758702855803393,47.22
