skill,score,count,avg,normalize
robustness,9.0,18,0.5,3.0
correctness,13.0,50,0.26,2.04
efficiency,12.0,20,0.6,3.4
factuality,15.0,44,0.3409090909090909,2.3636363636363633
commonsense,24.0,51,0.47058823529411764,2.8823529411764706
comprehension,52.0,99,0.5252525252525253,3.101010101010101
insightfulness,4.0,12,0.3333333333333333,2.333333333333333
completeness,9.0,29,0.3103448275862069,2.2413793103448274
metacognition,12.0,21,0.5714285714285714,3.2857142857142856
readability,12.0,14,0.8571428571428571,4.428571428571429
conciseness,10.0,19,0.5263157894736842,3.1052631578947367
harmlessness,19.0,25,0.76,4.04
