skill,score,count,avg,normalize
robustness,6.0,19,0.3157894736842105,2.263157894736842
correctness,12.0,49,0.24489795918367346,1.9795918367346939
efficiency,6.0,20,0.3,2.2
factuality,18.0,43,0.4186046511627907,2.674418604651163
commonsense,25.0,51,0.49019607843137253,2.9607843137254903
comprehension,45.0,99,0.45454545454545453,2.8181818181818183
insightfulness,7.0,12,0.5833333333333334,3.3333333333333335
completeness,14.0,29,0.4827586206896552,2.931034482758621
metacognition,12.0,21,0.5714285714285714,3.2857142857142856
readability,11.0,14,0.7857142857142857,4.142857142857142
conciseness,12.0,19,0.631578947368421,3.526315789473684
harmlessness,18.0,25,0.72,3.88
