skill,score,count,avg,normalize
robustness,41.0,19,2.1578947368421053,9.631578947368421
correctness,94.0,50,1.88,8.52
efficiency,58.0,20,2.9,12.6
factuality,117.0,44,2.659090909090909,11.636363636363637
commonsense,141.0,51,2.764705882352941,12.058823529411764
comprehension,262.0,99,2.6464646464646466,11.585858585858587
insightfulness,35.0,12,2.9166666666666665,12.666666666666666
completeness,87.0,29,3.0,13.0
metacognition,64.0,21,3.0476190476190474,13.19047619047619
readability,55.0,14,3.9285714285714284,16.714285714285715
conciseness,60.0,19,3.1578947368421053,13.631578947368421
harmlessness,112.0,25,4.48,18.92
