,unc_name,dataset,model,nan_values_in_cor,score
0,predent,SQUAD,qwen2_32b_i_0.6,0,0.7645995710794746
1,len_norm_predent,SQUAD,qwen2_32b_i_0.6,0,0.7375887578329923
2,seqlen_sample,SQUAD,qwen2_32b_i_0.6,0,0.5494447386013718
3,seqlen_correct,SQUAD,qwen2_32b_i_0.6,0,0.7910790432768212
4,TOKEN_SAR,SQUAD,qwen2_32b_i_0.6,0,0.6881642224212273
5,SENT_SAR,SQUAD,qwen2_32b_i_0.6,0,0.718290498031324
6,SAR,SQUAD,qwen2_32b_i_0.6,0,0.7253862441249012
7,log_pplx,SQUAD,qwen2_32b_i_0.6,0,0.842661929132205
8,sement,SQUAD,qwen2_32b_i_0.6,0,0.6606911902743209
9,min_logprob,SQUAD,qwen2_32b_i_0.6,11862,0.13333333333333333
10,len_norm_sement,SQUAD,qwen2_32b_i_0.6,0,0.6791631481336451
11,ptrue_neg_log_prob,SQUAD,qwen2_32b_i_0.6,0,0.49891975361188773
12,GNLL,SQUAD,qwen2_32b_i_0.6,0,0.8573751715284847
