skill,score,count,avg,normalize
robustness,25.0,19,1.3157894736842106,6.2631578947368425
correctness,85.0,50,1.7,7.8
efficiency,39.0,20,1.95,8.8
factuality,103.0,44,2.340909090909091,10.363636363636363
commonsense,108.0,51,2.1176470588235294,9.470588235294118
comprehension,219.0,99,2.212121212121212,9.848484848484848
insightfulness,27.0,12,2.25,10.0
completeness,62.5,29,2.1551724137931036,9.620689655172415
metacognition,41.0,21,1.9523809523809523,8.80952380952381
readability,54.0,14,3.857142857142857,16.42857142857143
conciseness,64.0,19,3.3684210526315788,14.473684210526315
harmlessness,61.0,25,2.44,10.76
