skill,score,count,avg
robustness,27.0,13,2.076923076923077
correctness,43.0,27,1.5925925925925926
efficiency,48.0,16,3.0
factuality,62.0,25,2.48
commonsense,100.0,40,2.5
comprehension,161.0,59,2.7288135593220337
insightfulness,27.0,12,2.25
completeness,46.0,18,2.5555555555555554
metacognition,42.0,19,2.210526315789474
readability,54.0,12,4.5
conciseness,55.0,12,4.583333333333333
harmlessness,34.0,12,2.8333333333333335
