skill,score,count,avg
robustness,42.0,13,3.230769230769231
correctness,62.0,27,2.2962962962962963
efficiency,57.0,15,3.8
factuality,85.0,27,3.1481481481481484
commonsense,127.0,39,3.2564102564102564
comprehension,205.0,59,3.4745762711864407
insightfulness,41.0,12,3.4166666666666665
completeness,63.0,18,3.5
metacognition,60.0,19,3.1578947368421053
readability,57.0,12,4.75
conciseness,55.0,12,4.583333333333333
harmlessness,50.0,12,4.166666666666667
