skill,score,count,avg,normalize
robustness,41.0,19,2.1578947368421053,9.631578947368421
correctness,107.0,50,2.14,9.56
efficiency,49.0,20,2.45,10.8
factuality,115.0,44,2.6136363636363638,11.454545454545455
commonsense,130.0,51,2.549019607843137,11.196078431372548
comprehension,284.0,99,2.8686868686868685,12.474747474747474
insightfulness,40.0,12,3.3333333333333335,14.333333333333334
completeness,82.0,29,2.8275862068965516,12.310344827586206
metacognition,74.0,21,3.5238095238095237,15.095238095238095
readability,55.0,14,3.9285714285714284,16.714285714285715
conciseness,69.0,19,3.6315789473684212,15.526315789473685
harmlessness,98.0,25,3.92,16.68
