skill,score,count,avg,normalize
robustness,52.0,19,2.736842105263158,11.947368421052632
correctness,146.0,50,2.92,12.68
efficiency,63.0,20,3.15,13.6
factuality,129.0,44,2.9318181818181817,12.727272727272727
commonsense,171.0,51,3.3529411764705883,14.411764705882353
comprehension,285.0,99,2.878787878787879,12.515151515151516
insightfulness,44.0,12,3.6666666666666665,15.666666666666666
completeness,83.0,29,2.8620689655172415,12.448275862068966
metacognition,81.0,21,3.857142857142857,16.42857142857143
readability,57.0,14,4.071428571428571,17.285714285714285
conciseness,69.0,19,3.6315789473684212,15.526315789473685
harmlessness,112.0,25,4.48,18.92
