,unc_name,dataset,model,nan_values_in_cor,score
0,predent,SQUAD,phi35_i_1.,0,0.6608823260681301
1,len_norm_predent,SQUAD,phi35_i_1.,0,0.5894079103432386
2,seqlen_sample,SQUAD,phi35_i_1.,0,0.6296889276305859
3,seqlen_correct,SQUAD,phi35_i_1.,0,0.6117122316692943
4,EigenScore,SQUAD,phi35_i_1.,0,0.6760114789302297
5,TOKEN_SAR,SQUAD,phi35_i_1.,0,0.55955507298686
6,SENT_SAR,SQUAD,phi35_i_1.,0,0.6466591528961498
7,SAR,SQUAD,phi35_i_1.,0,0.580230171647661
8,log_pplx,SQUAD,phi35_i_1.,0,0.63789384869627
9,sement,SQUAD,phi35_i_1.,0,0.6489978281571173
10,min_logprob,SQUAD,phi35_i_1.,0,0.6315000073775692
11,len_norm_sement,SQUAD,phi35_i_1.,0,0.6781115323892315
12,ptrue_neg_log_prob,SQUAD,phi35_i_1.,0,0.5624461437445591
13,GNLL,SQUAD,phi35_i_1.,0,0.6562704656608203
14,predent,SQUAD,llama3_8b_i_1.,0,0.6649673854689127
15,len_norm_predent,SQUAD,llama3_8b_i_1.,0,0.5923326483544048
16,seqlen_sample,SQUAD,llama3_8b_i_1.,0,0.5843909220713036
17,seqlen_correct,SQUAD,llama3_8b_i_1.,0,0.601838873320326
18,EigenScore,SQUAD,llama3_8b_i_1.,0,0.6819461091267343
19,TOKEN_SAR,SQUAD,llama3_8b_i_1.,0,0.6095956496176718
20,SENT_SAR,SQUAD,llama3_8b_i_1.,0,0.7082792784510283
21,SAR,SQUAD,llama3_8b_i_1.,0,0.6439895227166708
22,log_pplx,SQUAD,llama3_8b_i_1.,1,0.6951002404783856
23,sement,SQUAD,llama3_8b_i_1.,0,0.6668779630871835
24,min_logprob,SQUAD,llama3_8b_i_1.,1,0.66233782395654
25,len_norm_sement,SQUAD,llama3_8b_i_1.,0,0.7085678265340521
26,ptrue_neg_log_prob,SQUAD,llama3_8b_i_1.,0,0.7779973503176327
27,GNLL,SQUAD,llama3_8b_i_1.,1,0.682698369835522
28,predent,KUQ,llama3_8b_i_1.,0,0.7183765063192671
29,len_norm_predent,KUQ,llama3_8b_i_1.,0,0.26257782443804467
30,seqlen_sample,KUQ,llama3_8b_i_1.,0,0.8451096064694359
31,seqlen_correct,KUQ,llama3_8b_i_1.,0,0.7903378978182358
32,EigenScore,KUQ,llama3_8b_i_1.,0,0.759888486351239
33,TOKEN_SAR,KUQ,llama3_8b_i_1.,0,0.7092374920646738
34,SENT_SAR,KUQ,llama3_8b_i_1.,0,0.6536605815027323
35,SAR,KUQ,llama3_8b_i_1.,0,0.6920373427315618
36,log_pplx,KUQ,llama3_8b_i_1.,23,0.6060002171959729
37,sement,KUQ,llama3_8b_i_1.,0,0.3782148041851423
38,min_logprob,KUQ,llama3_8b_i_1.,23,0.5544708975241188
39,len_norm_sement,KUQ,llama3_8b_i_1.,0,0.7198935558440592
40,ptrue_neg_log_prob,KUQ,llama3_8b_i_1.,0,0.6689811948489024
41,GNLL,KUQ,llama3_8b_i_1.,23,0.7863393250303743
42,predent,KUQ,phi35_i_1.,0,0.7357775446452575
43,len_norm_predent,KUQ,phi35_i_1.,0,0.4174557679154788
44,seqlen_sample,KUQ,phi35_i_1.,0,0.8726851658418823
45,seqlen_correct,KUQ,phi35_i_1.,0,0.8309846202594523
46,EigenScore,KUQ,phi35_i_1.,0,0.7724862519760767
47,TOKEN_SAR,KUQ,phi35_i_1.,0,0.8049303729723611
48,SENT_SAR,KUQ,phi35_i_1.,0,0.7268568072543546
49,SAR,KUQ,phi35_i_1.,0,0.8066876452172087
50,log_pplx,KUQ,phi35_i_1.,0,0.7825839203216858
51,sement,KUQ,phi35_i_1.,0,0.5190133413081199
52,min_logprob,KUQ,phi35_i_1.,0,0.6482376337842617
53,len_norm_sement,KUQ,phi35_i_1.,0,0.6379204224678638
54,ptrue_neg_log_prob,KUQ,phi35_i_1.,0,0.4163632018970673
55,GNLL,KUQ,phi35_i_1.,0,0.8562395319320228
56,predent,SQUAD,llama3_8b_1.,0,0.4549090203836563
57,len_norm_predent,SQUAD,llama3_8b_1.,0,0.4129559905294712
58,seqlen_sample,SQUAD,llama3_8b_1.,0,0.48522697091762196
59,seqlen_correct,SQUAD,llama3_8b_1.,0,0.5334792815155569
60,EigenScore,SQUAD,llama3_8b_1.,0,0.49120495852103574
61,TOKEN_SAR,SQUAD,llama3_8b_1.,0,0.5010499132284356
62,SENT_SAR,SQUAD,llama3_8b_1.,1,0.4897593605318556
63,SAR,SQUAD,llama3_8b_1.,79,0.4727352877370471
64,log_pplx,SQUAD,llama3_8b_1.,0,0.4717712210104092
65,sement,SQUAD,llama3_8b_1.,0,0.4155524692724241
66,min_logprob,SQUAD,llama3_8b_1.,0,0.5244191441111674
67,len_norm_sement,SQUAD,llama3_8b_1.,0,0.5261479639611417
68,ptrue_neg_log_prob,SQUAD,llama3_8b_1.,0,0.5005219913988892
69,GNLL,SQUAD,llama3_8b_1.,0,0.5274860847694056
70,predent,SQUAD,llama3_70b_i_1.,0,0.6802423725830212
71,len_norm_predent,SQUAD,llama3_70b_i_1.,0,0.6058768008449872
72,seqlen_sample,SQUAD,llama3_70b_i_1.,0,0.6167682909423174
73,seqlen_correct,SQUAD,llama3_70b_i_1.,0,0.5811328108330529
74,EigenScore,SQUAD,llama3_70b_i_1.,0,0.6950022319096538
75,TOKEN_SAR,SQUAD,llama3_70b_i_1.,0,0.6499249788703197
76,SENT_SAR,SQUAD,llama3_70b_i_1.,0,0.7211742151037078
77,SAR,SQUAD,llama3_70b_i_1.,0,0.673703388544941
78,log_pplx,SQUAD,llama3_70b_i_1.,0,0.44948658981784073
79,sement,SQUAD,llama3_70b_i_1.,0,0.660880415219382
80,min_logprob,SQUAD,llama3_70b_i_1.,0,0.6075000679781718
81,len_norm_sement,SQUAD,llama3_70b_i_1.,0,0.6980050608015154
82,ptrue_neg_log_prob,SQUAD,llama3_70b_i_1.,0,0.8582512711273013
83,GNLL,SQUAD,llama3_70b_i_1.,0,0.6769070554375135
