skill,score,count,avg
robustness,27.0,13,2.076923076923077
correctness,46.0,27,1.7037037037037037
efficiency,60.0,16,3.75
factuality,77.0,26,2.9615384615384617
commonsense,112.0,40,2.8
comprehension,184.0,59,3.1186440677966103
insightfulness,40.0,12,3.3333333333333335
completeness,63.0,18,3.5
metacognition,72.0,19,3.789473684210526
readability,54.0,12,4.5
conciseness,57.0,12,4.75
harmlessness,60.0,12,5.0
