skill,score,count,avg,normalize
robustness,5.0,19,0.2631578947368421,2.052631578947368
correctness,11.0,50,0.22,1.88
efficiency,9.0,20,0.45,2.8
factuality,20.0,44,0.45454545454545453,2.8181818181818183
commonsense,25.0,51,0.49019607843137253,2.9607843137254903
comprehension,42.0,99,0.42424242424242425,2.6969696969696972
insightfulness,4.0,12,0.3333333333333333,2.333333333333333
completeness,9.0,29,0.3103448275862069,2.2413793103448274
metacognition,16.0,21,0.7619047619047619,4.0476190476190474
readability,12.0,14,0.8571428571428571,4.428571428571429
conciseness,13.0,19,0.6842105263157895,3.736842105263158
harmlessness,22.0,25,0.88,4.52
