experiment,task,path,total,correct,top2_correct,accuracy,top2_accuracy,rms_error
gpt-4o_4options_20250318_070420,text2image_given,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/gpt-4o_4options_20250318_070420/results.csv,44,38,39,0.8636363636363636,0.8863636363636364,0.40501122318905053
gpt-4o_4options_20250318_070520,text2image_option,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/gpt-4o_4options_20250318_070520/results.csv,93,75,87,0.8064516129032258,0.9354838709677419,0.4249920935380945
gemini-1.5-pro_4options_20250318_070420,text2image_given,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/gemini-1.5-pro_4options_20250318_070420/results.csv,66,51,56,0.7727272727272727,0.8484848484848485,0.47899199714956964
gpt-4o_4options_20250318_070220,image2text_given,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/gpt-4o_4options_20250318_070220/results.csv,797,605,690,0.7590966122961104,0.8657465495608532,0.4714947266829576
gpt-4o_4options_20250318_070320,image2text_option,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/gpt-4o_4options_20250318_070320/results.csv,834,620,707,0.7434052757793765,0.8477218225419664,0.4856401989927294
gemini-1.5-pro_4options_20250318_070220,image2text_given,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/gemini-1.5-pro_4options_20250318_070220/results.csv,864,630,729,0.7291666666666666,0.84375,0.5094146059358141
qwen-vl-max_4options_20250318_070420,text2image_given,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/qwen-vl-max_4options_20250318_070420/results.csv,125,91,107,0.728,0.856,0.5814292734288496
step-1o-turbo-vision_4options_20250318_070520,text2image_option,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/step-1o-turbo-vision_4options_20250318_070520/results.csv,259,186,218,0.7181467181467182,0.8416988416988417,0.517064031194602
step-1o-turbo-vision_4options_20250318_070220,image2text_given,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/step-1o-turbo-vision_4options_20250318_070220/results.csv,1942,1387,1619,0.7142121524201854,0.833676622039135,0.5163981949789803
step-1o-turbo-vision_4options_20250318_070420,text2image_given,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/step-1o-turbo-vision_4options_20250318_070420/results.csv,274,195,230,0.7116788321167883,0.8394160583941606,0.5391514690412548
gemini-1.5-pro_4options_20250318_070320,image2text_option,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/gemini-1.5-pro_4options_20250318_070320/results.csv,890,622,731,0.698876404494382,0.8213483146067416,0.5336191883752375
qwen-vl-max_4options_20250318_070320,image2text_option,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/qwen-vl-max_4options_20250318_070320/results.csv,1785,1241,1487,0.6952380952380952,0.8330532212885154,0.5833960270431638
qwen-vl-max_4options_20250318_070220,image2text_given,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/qwen-vl-max_4options_20250318_070220/results.csv,1761,1222,1433,0.693923906871096,0.8137421919363997,0.5776784393846859
step-1o-turbo-vision_4options_20250318_070320,image2text_option,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/step-1o-turbo-vision_4options_20250318_070320/results.csv,2061,1423,1693,0.6904415332362931,0.8214459000485201,0.52866750001311
step-1v-8k_4options_20250318_070320,image2text_option,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/step-1v-8k_4options_20250318_070320/results.csv,1340,921,1060,0.6873134328358209,0.7910447761194029,0.5370697167007418
gemini-1.5-pro_4options_20250318_070520,text2image_option,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/gemini-1.5-pro_4options_20250318_070520/results.csv,72,49,61,0.6805555555555556,0.8472222222222222,0.5596142024248094
step-1v-8k_4options_20250318_070220,image2text_given,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/step-1v-8k_4options_20250318_070220/results.csv,1682,1142,1316,0.6789536266349584,0.7824019024970273,0.5484314337067961
qwen-vl-max_4options_20250318_070520,text2image_option,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/qwen-vl-max_4options_20250318_070520/results.csv,143,97,118,0.6783216783216783,0.8251748251748252,0.5646491577330752
step-1v-8k_4options_20250318_070420,text2image_given,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/step-1v-8k_4options_20250318_070420/results.csv,215,143,164,0.6651162790697674,0.7627906976744186,0.5430473875420809
step-1v-8k_4options_20250318_070520,text2image_option,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/step-1v-8k_4options_20250318_070520/results.csv,211,140,166,0.6635071090047393,0.7867298578199052,0.5488920335138563
qwen2.5-vl-7b-instruct_4options_20250318_070520,text2image_option,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/qwen2.5-vl-7b-instruct_4options_20250318_070520/results.csv,116,74,89,0.6379310344827587,0.7672413793103449,0.5685924848194034
ernie-4.5-8k-preview_4options_20250318_070320,image2text_option,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/ernie-4.5-8k-preview_4options_20250318_070320/results.csv,618,380,478,0.6148867313915858,0.7734627831715211,0.5897862426282229
qwen2.5-vl-7b-instruct_4options_20250318_070320,image2text_option,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/qwen2.5-vl-7b-instruct_4options_20250318_070320/results.csv,1875,1125,1413,0.6,0.7536,0.5938608591244249
qwen2.5-vl-7b-instruct_4options_20250318_070220,image2text_given,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/qwen2.5-vl-7b-instruct_4options_20250318_070220/results.csv,1903,1126,1409,0.5916973200210195,0.7404098791382029,0.6019807033532462
ernie-4.5-8k-preview_4options_20250318_070420,text2image_given,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/ernie-4.5-8k-preview_4options_20250318_070420/results.csv,108,63,78,0.5833333333333334,0.7222222222222222,0.6284269013738754
ernie-4.5-8k-preview_4options_20250318_070520,text2image_option,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/ernie-4.5-8k-preview_4options_20250318_070520/results.csv,121,70,95,0.5785123966942148,0.7851239669421488,0.6082665004693423
ernie-4.5-8k-preview_4options_20250318_070220,image2text_given,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/ernie-4.5-8k-preview_4options_20250318_070220/results.csv,541,307,396,0.5674676524953789,0.7319778188539742,0.6310344176264914
qwen2.5-vl-7b-instruct_4options_20250318_070420,text2image_given,/home/ubuntu/scratch/mhjiang/CNS_cover/experiment/results/understanding/qwen2.5-vl-7b-instruct_4options_20250318_070420/results.csv,105,59,80,0.5619047619047619,0.7619047619047619,0.6121391065062628
