skill,score,count,avg,normalize
robustness,5.0,19,0.2631578947368421,2.052631578947368
correctness,8.0,50,0.16,1.6400000000000001
efficiency,8.0,20,0.4,2.6
factuality,17.0,44,0.38636363636363635,2.5454545454545454
commonsense,24.0,51,0.47058823529411764,2.8823529411764706
comprehension,41.0,99,0.41414141414141414,2.6565656565656566
insightfulness,2.0,12,0.16666666666666666,1.6666666666666665
completeness,12.0,29,0.41379310344827586,2.655172413793103
metacognition,15.0,21,0.7142857142857143,3.857142857142857
readability,12.0,14,0.8571428571428571,4.428571428571429
conciseness,9.0,19,0.47368421052631576,2.894736842105263
harmlessness,24.0,25,0.96,4.84
