model_class,metric,score,pvalue,eff_size
vicuna-7b,v_wn_lda,0.43098693573235225,0.0,0
vicuna-7b,v_s_wn_lda,0.35644845724716495,0.0,0
vicuna-7b,v_wn_mean,0.4223863476423738,0.0,0
vicuna-7b,v_s_wn_mean,0.3557508564391579,0.0,0
vicuna-7b,l_wn_lda,0.43176340857789214,0.0,0
vicuna-7b,l_s_wn_lda,0.3672364803888895,0.0,0
vicuna-7b,l_wn_mean,0.42287107453552375,0.0,0
vicuna-7b,l_s_wn_mean,0.3683927856228824,0.0,0
vicuna-7b,v_l_lda,0.9998238658693345,0.0,0
vicuna-7b,v_l_mean,0.9998569186409069,0.0,0
vicuna-7b,v_l_non_param_lda_diff,-0.0007741542337466273,5.767203615817138e-18,0.8637072007139313
vicuna-7b,v_l_non_param_diff,-0.0005350736847541687,2.964263914228315e-17,0.8447964140740961
vicuna-7b,v_l_non_param_diff_sims,0.0004860087252698231,5.880974579924446e-92,8.035001332957505
vicuna-7b,v_l_sampled_rsa_mean,0.9998178731310527,0,0
vicuna-7b,v_l_sampled_rsa_sd,2.5523518546410027e-05,0,0
vicuna-7b,v_wn_lda_rsa_mean,0.42973662723877587,0,0
vicuna-7b,v_wn_lda_rsa_sd,0.035146932718527535,0,0
vicuna-7b,l_wn_lda_rsa_mean,0.43071524249210474,0,0
vicuna-7b,l_wn_lda_rsa_sd,0.035283797133345826,0,0
qwen-2-7b-molmo,v_wn_lda,0.3789939773180567,0.0,0
qwen-2-7b-molmo,v_s_wn_lda,0.2313890676843828,0.0,0
qwen-2-7b-molmo,v_wn_mean,0.3759697348428725,0.0,0
qwen-2-7b-molmo,v_s_wn_mean,0.23457551138205185,0.0,0
qwen-2-7b-molmo,l_wn_lda,0.39902734676090384,0.0,0
qwen-2-7b-molmo,l_s_wn_lda,0.2309114120837236,0.0,0
qwen-2-7b-molmo,l_wn_mean,0.38972124078196363,0.0,0
qwen-2-7b-molmo,l_s_wn_mean,0.233461337052897,0.0,0
qwen-2-7b-molmo,v_l_lda,0.961095735606977,0.0,0
qwen-2-7b-molmo,v_l_mean,0.9544470346108808,0.0,0
qwen-2-7b-molmo,v_l_non_param_lda_diff,-0.02153495647783005,4.9610417082651575e-18,0.8654263631357347
qwen-2-7b-molmo,v_l_non_param_diff,-0.013893328686485937,3.67462457090672e-16,0.8148829879347202
qwen-2-7b-molmo,v_l_non_param_diff_sims,0.0003228004386718641,0.0026867845423649197,0.3079128333788507
qwen-2-7b-molmo,v_l_sampled_rsa_mean,0.9609019317234149,0,0
qwen-2-7b-molmo,v_l_sampled_rsa_sd,0.006543383088944044,0,0
qwen-2-7b-molmo,v_wn_lda_rsa_mean,0.38342337476975685,0,0
qwen-2-7b-molmo,v_wn_lda_rsa_sd,0.04485200776102888,0,0
qwen-2-7b-molmo,l_wn_lda_rsa_mean,0.3914889728342545,0,0
qwen-2-7b-molmo,l_wn_lda_rsa_sd,0.04243134739811036,0,0
llama-3.1-8b,v_wn_lda,0.4035733137272634,0.0,0
llama-3.1-8b,v_s_wn_lda,0.2297189589395017,0.0,0
llama-3.1-8b,v_wn_mean,0.3894417459205329,0.0,0
llama-3.1-8b,v_s_wn_mean,0.23052942356360043,0.0,0
llama-3.1-8b,l_wn_lda,0.4055494753264072,0.0,0
llama-3.1-8b,l_s_wn_lda,0.2293107258275358,0.0,0
llama-3.1-8b,l_wn_mean,0.39082230501056653,0.0,0
llama-3.1-8b,l_s_wn_mean,0.23006398503448208,0.0,0
llama-3.1-8b,v_l_lda,0.9993752896108025,0.0,0
llama-3.1-8b,v_l_mean,0.9996115841586766,0.0,0
llama-3.1-8b,v_l_non_param_lda_diff,-0.0018683401574883906,8.777880718979924e-18,0.8588935459328824
llama-3.1-8b,v_l_non_param_diff,-0.0013251120704892555,6.504110965076778e-18,0.8623318707764888
llama-3.1-8b,v_l_non_param_diff_sims,0.0016931290800581966,3.78198399552124e-105,10.958278515541295
llama-3.1-8b,v_l_sampled_rsa_mean,0.9993660689758612,0,0
llama-3.1-8b,v_l_sampled_rsa_sd,0.0001077613815952344,0,0
llama-3.1-8b,v_wn_lda_rsa_mean,0.39881475056991816,0,0
llama-3.1-8b,v_wn_lda_rsa_sd,0.04486769840118984,0,0
llama-3.1-8b,l_wn_lda_rsa_mean,0.40784301434110437,0,0
llama-3.1-8b,l_wn_lda_rsa_sd,0.042770846610338815,0,0
qwen-2-7b-llava-ov,v_wn_lda,0.39642585414681736,0.0,0
qwen-2-7b-llava-ov,v_s_wn_lda,0.23989296439663532,0.0,0
qwen-2-7b-llava-ov,v_wn_mean,0.3913961087791058,0.0,0
qwen-2-7b-llava-ov,v_s_wn_mean,0.24722557493000033,0.0,0
qwen-2-7b-llava-ov,l_wn_lda,0.39840131851454913,0.0,0
qwen-2-7b-llava-ov,l_s_wn_lda,0.232241692174906,0.0,0
qwen-2-7b-llava-ov,l_wn_mean,0.38996743745108575,0.0,0
qwen-2-7b-llava-ov,l_s_wn_mean,0.23462591571592337,0.0,0
qwen-2-7b-llava-ov,v_l_lda,0.9955533835464553,0.0,0
qwen-2-7b-llava-ov,v_l_mean,0.9958153313228961,0.0,0
qwen-2-7b-llava-ov,v_l_non_param_lda_diff,-0.002263940549239179,4.4702031274545934e-09,0.5865782183192543
qwen-2-7b-llava-ov,v_l_non_param_diff,0.001251155435273375,0.0016354699829627477,0.31495055567434765
qwen-2-7b-llava-ov,v_l_non_param_diff_sims,0.004174898110254486,4.536976910835538e-82,6.355952476292396
qwen-2-7b-llava-ov,v_l_sampled_rsa_mean,0.9954172229281213,0,0
qwen-2-7b-llava-ov,v_l_sampled_rsa_sd,0.0006986768374957617,0,0
qwen-2-7b-llava-ov,v_wn_lda_rsa_mean,0.4000790518358586,0,0
qwen-2-7b-llava-ov,v_wn_lda_rsa_sd,0.04416240593245944,0,0
qwen-2-7b-llava-ov,l_wn_lda_rsa_mean,0.3978052341644854,0,0
qwen-2-7b-llava-ov,l_wn_lda_rsa_sd,0.04967227658683531,0,0
llama-3.1-8b-instruct,v_wn_lda,0.40357329734968517,0.0,0
llama-3.1-8b-instruct,v_s_wn_lda,0.22971899992891154,0.0,0
llama-3.1-8b-instruct,v_wn_mean,0.38944174177781266,0.0,0
llama-3.1-8b-instruct,v_s_wn_mean,0.23052941592657603,0.0,0
llama-3.1-8b-instruct,l_wn_lda,0.4035727747745303,0.0,0
llama-3.1-8b-instruct,l_s_wn_lda,0.22973013199630576,0.0,0
llama-3.1-8b-instruct,l_wn_mean,0.3894340533706026,0.0,0
llama-3.1-8b-instruct,l_s_wn_mean,0.230541912950993,0.0,0
llama-3.1-8b-instruct,v_l_lda,0.999999871305479,0.0,0
llama-3.1-8b-instruct,v_l_mean,0.9999999357035961,0.0,0
llama-3.1-8b-instruct,v_l_non_param_lda_diff,1.0753684404402053e-06,0.4270481369484205,0.07942530388730819
llama-3.1-8b-instruct,v_l_non_param_diff,7.95917113711797e-06,1.3460606544893094e-08,0.5680112641637797
llama-3.1-8b-instruct,v_l_non_param_diff_sims,-5.364868541635204e-07,3.8600786589407823e-13,-0.8369143882526682
llama-3.1-8b-instruct,v_l_sampled_rsa_mean,0.9999997095702545,0,0
llama-3.1-8b-instruct,v_l_sampled_rsa_sd,4.251585833634897e-08,0,0
llama-3.1-8b-instruct,v_wn_lda_rsa_mean,0.4043005124639772,0,0
llama-3.1-8b-instruct,v_wn_lda_rsa_sd,0.04040307344223789,0,0
llama-3.1-8b-instruct,l_wn_lda_rsa_mean,0.39905513765473005,0,0
llama-3.1-8b-instruct,l_wn_lda_rsa_sd,0.044948347244516365,0,0
mistral-7b,v_wn_lda,0.41820237208124117,0.0,0
mistral-7b,v_s_wn_lda,0.3615370378404426,0.0,0
mistral-7b,v_wn_mean,0.41021400151771076,0.0,0
mistral-7b,v_s_wn_mean,0.3623325117831992,0.0,0
mistral-7b,l_wn_lda,0.41826133813125854,0.0,0
mistral-7b,l_s_wn_lda,0.3402591318305075,0.0,0
mistral-7b,l_wn_mean,0.4101786304693142,0.0,0
mistral-7b,l_s_wn_mean,0.3389987648284931,0.0,0
mistral-7b,v_l_lda,0.999844233541223,0.0,0
mistral-7b,v_l_mean,0.9998770314457407,0.0,0
mistral-7b,v_l_non_param_lda_diff,-0.00011183731941161346,0.00653382133312757,0.27197149512926744
mistral-7b,v_l_non_param_diff,0.00010439220126794102,0.006137474165144637,0.27403449003543123
mistral-7b,v_l_non_param_diff_sims,0.00020469064189865716,6.44995750103625e-65,4.201391258275199
mistral-7b,v_l_sampled_rsa_mean,0.9998386654174105,0,0
mistral-7b,v_l_sampled_rsa_sd,2.5917318272566647e-05,0,0
mistral-7b,v_wn_lda_rsa_mean,0.41862876756573064,0,0
mistral-7b,v_wn_lda_rsa_sd,0.03555477389193968,0,0
mistral-7b,l_wn_lda_rsa_mean,0.41787393616442264,0,0
mistral-7b,l_wn_lda_rsa_sd,0.0322642630120623,0,0
qwen-2.5-7b-instruct,v_wn_lda,0.3787515657699921,0.0,0
qwen-2.5-7b-instruct,v_s_wn_lda,0.23600899036092574,0.0,0
qwen-2.5-7b-instruct,v_wn_mean,0.38057642260701036,0.0,0
qwen-2.5-7b-instruct,v_s_wn_mean,0.23938652413428868,0.0,0
qwen-2.5-7b-instruct,l_wn_lda,0.4003356907946703,0.0,0
qwen-2.5-7b-instruct,l_s_wn_lda,0.2340388064906284,0.0,0
qwen-2.5-7b-instruct,l_wn_mean,0.39072136296339616,0.0,0
qwen-2.5-7b-instruct,l_s_wn_mean,0.2365796672558952,0.0,0
qwen-2.5-7b-instruct,v_l_lda,0.9561153351400489,0.0,0
qwen-2.5-7b-instruct,v_l_mean,0.9564832174446211,0.0,0
qwen-2.5-7b-instruct,v_l_non_param_lda_diff,-0.02200722044542715,4.813701823147399e-18,0.8657701956200953
qwen-2.5-7b-instruct,v_l_non_param_diff,-0.00963378984173658,1.066761824101504e-10,0.6457174056292847
qwen-2.5-7b-instruct,v_l_non_param_diff_sims,-0.034086128588675574,1.7996532196170874e-120,-15.68255787302068
qwen-2.5-7b-instruct,v_l_sampled_rsa_mean,0.9553693391185634,0,0
qwen-2.5-7b-instruct,v_l_sampled_rsa_sd,0.0063747079252154506,0,0
qwen-2.5-7b-instruct,v_wn_lda_rsa_mean,0.37515556305269376,0,0
qwen-2.5-7b-instruct,v_wn_lda_rsa_sd,0.04696156451152322,0,0
qwen-2.5-7b-instruct,l_wn_lda_rsa_mean,0.3968146457320206,0,0
qwen-2.5-7b-instruct,l_wn_lda_rsa_sd,0.04181592072089659,0,0
smollm2-135m,v_wn_lda,0.3977426789326964,0.0,0
smollm2-135m,v_s_wn_lda,0.1716190020273645,0.0,0
smollm2-135m,v_wn_mean,0.36708362823611723,0.0,0
smollm2-135m,v_s_wn_mean,0.17132198266196577,0.0,0
smollm2-135m,l_wn_lda,0.39343642961904235,0.0,0
smollm2-135m,l_s_wn_lda,0.17016726248792202,0.0,0
smollm2-135m,l_wn_mean,0.3643969076946448,0.0,0
smollm2-135m,l_s_wn_mean,0.17046040226774398,0.0,0
smollm2-135m,v_l_lda,0.9873941028228129,0.0,0
smollm2-135m,v_l_mean,0.991368776914382,0.0,0
smollm2-135m,v_l_non_param_lda_diff,0.004342480440957698,6.2835872740427154e-15,0.7798120745299347
smollm2-135m,v_l_non_param_diff,0.002698104155848255,3.2731004999774603e-10,0.6285257814112526
smollm2-135m,v_l_non_param_diff_sims,0.006100240084242468,2.5758982122910713e-96,8.904622298587222
smollm2-135m,v_l_sampled_rsa_mean,0.9872498988232659,0,0
smollm2-135m,v_l_sampled_rsa_sd,0.0016791221368218144,0,0
smollm2-135m,v_wn_lda_rsa_mean,0.39959616220057625,0,0
smollm2-135m,v_wn_lda_rsa_sd,0.04272099178274399,0,0
smollm2-135m,l_wn_lda_rsa_mean,0.39555895797962803,0,0
smollm2-135m,l_wn_lda_rsa_sd,0.04153612024043275,0,0
smollm2-360m,v_wn_lda,0.3940323380172261,0.0,0
smollm2-360m,v_s_wn_lda,0.1882378176383495,0.0,0
smollm2-360m,v_wn_mean,0.3685296663800727,0.0,0
smollm2-360m,v_s_wn_mean,0.18741721195427702,0.0,0
smollm2-360m,l_wn_lda,0.39379959352404825,0.0,0
smollm2-360m,l_s_wn_lda,0.19987375202007185,0.0,0
smollm2-360m,l_wn_mean,0.3689084310198026,0.0,0
smollm2-360m,l_s_wn_mean,0.1998757654780752,0.0,0
smollm2-360m,v_l_lda,0.9924821276757121,0.0,0
smollm2-360m,v_l_mean,0.9949306121088812,0.0,0
smollm2-360m,v_l_non_param_lda_diff,0.00022844882953482637,0.4053668309798979,0.08320746121527522
smollm2-360m,v_l_non_param_diff,-0.0007815136574061865,0.00810869304206474,0.26475101295769393
smollm2-360m,v_l_non_param_diff_sims,0.004112555195129536,1.9079306482478983e-93,8.322344217761595
smollm2-360m,v_l_sampled_rsa_mean,0.9922514029178228,0,0
smollm2-360m,v_l_sampled_rsa_sd,0.0009907778926004911,0,0
smollm2-360m,v_wn_lda_rsa_mean,0.39486178483941076,0,0
smollm2-360m,v_wn_lda_rsa_sd,0.03824998378610257,0,0
smollm2-360m,l_wn_lda_rsa_mean,0.3864789267012543,0,0
smollm2-360m,l_wn_lda_rsa_sd,0.0402139738039413,0,0
smollm2-1.7b,v_wn_lda,0.3818578997554093,0.0,0
smollm2-1.7b,v_s_wn_lda,0.20679203884517425,0.0,0
smollm2-1.7b,v_wn_mean,0.36164601336721103,0.0,0
smollm2-1.7b,v_s_wn_mean,0.20734564900840413,0.0,0
smollm2-1.7b,l_wn_lda,0.38611258988519853,0.0,0
smollm2-1.7b,l_s_wn_lda,0.21757410875185107,0.0,0
smollm2-1.7b,l_wn_mean,0.366158222410565,0.0,0
smollm2-1.7b,l_s_wn_mean,0.2191723611213441,0.0,0
smollm2-1.7b,v_l_lda,0.9961053857252181,0.0,0
smollm2-1.7b,v_l_mean,0.996693264807232,0.0,0
smollm2-1.7b,v_l_non_param_lda_diff,-0.0042778737848253,7.333806979251821e-18,0.8609565408390463
smollm2-1.7b,v_l_non_param_diff,-0.00489949559605448,4.0161556854627e-18,0.8678331905262591
smollm2-1.7b,v_l_non_param_diff_sims,0.0019520983250919943,2.226406640706063e-91,7.926037612407708
smollm2-1.7b,v_l_sampled_rsa_mean,0.9960689907570816,0,0
smollm2-1.7b,v_l_sampled_rsa_sd,0.0004465569733920155,0,0
smollm2-1.7b,v_wn_lda_rsa_mean,0.37948341030044547,0,0
smollm2-1.7b,v_wn_lda_rsa_sd,0.04046787661879075,0,0
smollm2-1.7b,l_wn_lda_rsa_mean,0.3884194622139019,0,0
smollm2-1.7b,l_wn_lda_rsa_sd,0.04106982740339209,0,0
