model_id,problem_id,category,subcategory,self_eval_answer,self_eval_correct,self_eval_confidence,judge_a_answer,judge_a_confidence,judge_b_answer,judge_b_confidence,judge_c_answer,judge_c_confidence,correct_answer
Qwen2.5-7B,arithmetic_basic_operations_e1,arithmetic,basic operations,A,0.0,0.9,B,0.75,A,0.95,B,0.9,A
Qwen2.5-7B,arithmetic_basic_operations_e2,arithmetic,basic operations,A,1.0,1.0,A,1.0,A,1.0,A,1.0,A
Qwen2.5-7B,arithmetic_basic_operations_e3,arithmetic,basic operations,B,1.0,0.9,B,0.9,B,0.95,B,1.0,B
Qwen2.5-7B,arithmetic_basic_operations_m1,arithmetic,basic operations,A,0.0,0.9,B,0.98,B,0.95,B,1.0,A
Qwen2.5-7B,arithmetic_basic_operations_m2,arithmetic,basic operations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Qwen2.5-7B,arithmetic_basic_operations_m3,arithmetic,basic operations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,arithmetic_basic_operations_h1,arithmetic,basic operations,A,1.0,0.95,A,0.85,A,0.95,B,0.95,B
Qwen2.5-7B,arithmetic_basic_operations_h2,arithmetic,basic operations,A,0.0,0.9,B,0.85,A,0.95,B,1.0,A
Qwen2.5-7B,arithmetic_basic_operations_h3,arithmetic,basic operations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,arithmetic_fractions_e1,arithmetic,fractions,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,arithmetic_fractions_e2,arithmetic,fractions,A,0.0,0.85,B,0.95,A,0.95,B,0.95,B
Qwen2.5-7B,arithmetic_fractions_e3,arithmetic,fractions,A,1.0,0.95,A,0.85,A,0.95,A,0.9,A
Qwen2.5-7B,arithmetic_fractions_m1,arithmetic,fractions,A,0.0,0.85,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B,arithmetic_fractions_m2,arithmetic,fractions,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,arithmetic_fractions_m3,arithmetic,fractions,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
Qwen2.5-7B,arithmetic_fractions_h1,arithmetic,fractions,A,0.0,0.95,B,0.9,A,0.95,B,1.0,A
Qwen2.5-7B,arithmetic_fractions_h2,arithmetic,fractions,A,0.0,0.9,B,1.0,B,0.98,B,1.0,A
Qwen2.5-7B,arithmetic_fractions_h3,arithmetic,fractions,A,1.0,0.95,A,1.0,A,1.0,A,1.0,B
Qwen2.5-7B,arithmetic_percentages_e1,arithmetic,percentages,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B,arithmetic_percentages_e2,arithmetic,percentages,A,0.0,0.9,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B,arithmetic_percentages_e3,arithmetic,percentages,A,0.0,0.9,B,0.85,B,0.95,B,0.95,A
Qwen2.5-7B,arithmetic_percentages_m1,arithmetic,percentages,A,1.0,0.85,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B,arithmetic_percentages_m2,arithmetic,percentages,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,arithmetic_percentages_m3,arithmetic,percentages,A,1.0,0.85,A,0.85,A,0.95,B,0.95,B
Qwen2.5-7B,arithmetic_percentages_h1,arithmetic,percentages,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,arithmetic_percentages_h2,arithmetic,percentages,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,arithmetic_percentages_h3,arithmetic,percentages,A,1.0,0.95,A,0.9,A,0.95,A,0.9,A
Qwen2.5-7B,arithmetic_numerical_e1,arithmetic,numerical approximation,B,1.0,1.0,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,arithmetic_numerical_e2,arithmetic,numerical approximation,A,0.0,0.9,A,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,arithmetic_numerical_e3,arithmetic,numerical approximation,A,0.0,0.85,B,0.9,B,0.95,B,0.95,B
Qwen2.5-7B,arithmetic_numerical_m1,arithmetic,numerical approximation,A,1.0,1.0,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B,arithmetic_numerical_m2,arithmetic,numerical approximation,A,1.0,0.9,A,0.85,A,0.9,B,0.95,A
Qwen2.5-7B,arithmetic_numerical_m3,arithmetic,numerical approximation,A,1.0,0.9,A,1.0,A,1.0,A,1.0,A
Qwen2.5-7B,arithmetic_numerical_h1,arithmetic,numerical approximation,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,arithmetic_numerical_h2,arithmetic,numerical approximation,A,1.0,0.8,A,0.95,A,0.95,B,0.95,A
Qwen2.5-7B,arithmetic_numerical_h3,arithmetic,numerical approximation,B,1.0,0.95,B,0.85,A,0.95,B,0.9,A
Qwen2.5-7B,arithmetic_order_e1,arithmetic,order of operations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,arithmetic_order_e2,arithmetic,order of operations,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,arithmetic_order_e3,arithmetic,order of operations,A,0.0,1.0,B,0.95,A,0.95,B,0.95,B
Qwen2.5-7B,arithmetic_order_m1,arithmetic,order of operations,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,arithmetic_order_m2,arithmetic,order of operations,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,arithmetic_order_m3,arithmetic,order of operations,A,1.0,0.85,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B,arithmetic_order_h1,arithmetic,order of operations,A,0.0,0.9,B,1.0,B,1.0,B,1.0,B
Qwen2.5-7B,arithmetic_order_h2,arithmetic,order of operations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Qwen2.5-7B,arithmetic_order_h3,arithmetic,order of operations,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,algebra_equations_e1,algebra,equations,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,algebra_equations_e2,algebra,equations,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,algebra_equations_e3,algebra,equations,A,0.0,0.85,B,0.75,A,0.95,B,0.95,B
Qwen2.5-7B,algebra_equations_m1,algebra,equations,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,algebra_equations_m2,algebra,equations,A,1.0,1.0,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,algebra_equations_m3,algebra,equations,A,0.0,0.9,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B,algebra_equations_h1,algebra,equations,A,0.0,0.9,B,0.9,B,0.95,B,0.95,A
Qwen2.5-7B,algebra_equations_h2,algebra,equations,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,algebra_equations_h3,algebra,equations,A,1.0,1.0,A,0.95,A,0.85,A,0.9,A
Qwen2.5-7B,algebra_inequalities_e1,algebra,inequalities,B,0.0,0.95,A,0.95,A,0.95,B,0.95,A
Qwen2.5-7B,algebra_inequalities_e2,algebra,inequalities,A,1.0,0.95,A,1.0,A,0.99,A,1.0,A
Qwen2.5-7B,algebra_inequalities_e3,algebra,inequalities,B,1.0,0.9,B,0.9,A,0.95,B,0.9,B
Qwen2.5-7B,algebra_inequalities_m1,algebra,inequalities,A,1.0,0.95,A,1.0,A,1.0,A,1.0,A
Qwen2.5-7B,algebra_inequalities_m2,algebra,inequalities,A,1.0,0.9,B,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,algebra_inequalities_m3,algebra,inequalities,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,algebra_inequalities_h1,algebra,inequalities,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Qwen2.5-7B,algebra_inequalities_h2,algebra,inequalities,A,0.0,0.9,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B,algebra_inequalities_h3,algebra,inequalities,A,1.0,0.9,A,0.85,A,0.95,B,0.95,A
Qwen2.5-7B,algebra_polynomials_e1,algebra,polynomials,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,algebra_polynomials_e2,algebra,polynomials,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,algebra_polynomials_e3,algebra,polynomials,A,1.0,0.85,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,algebra_polynomials_m1,algebra,polynomials,A,0.0,0.95,A,0.6,B,0.9,B,1.0,B
Qwen2.5-7B,algebra_polynomials_m2,algebra,polynomials,A,1.0,0.9,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,algebra_polynomials_m3,algebra,polynomials,A,1.0,0.85,B,0.9,A,0.9,A,1.0,B
Qwen2.5-7B,algebra_polynomials_h1,algebra,polynomials,A,0.0,0.95,B,0.75,A,0.95,B,0.95,A
Qwen2.5-7B,algebra_polynomials_h2,algebra,polynomials,A,1.0,0.9,A,0.55,A,0.98,B,0.95,B
Qwen2.5-7B,algebra_polynomials_h3,algebra,polynomials,A,1.0,0.95,B,0.6,A,0.7,A,0.8,A
Qwen2.5-7B,algebra_functions_e1,algebra,functions,A,1.0,0.95,A,0.95,A,0.95,B,0.95,A
Qwen2.5-7B,algebra_functions_e2,algebra,functions,A,0.0,0.9,B,0.85,A,0.95,B,0.95,A
Qwen2.5-7B,algebra_functions_e3,algebra,functions,A,1.0,0.95,A,0.55,A,0.95,A,0.95,B
Qwen2.5-7B,algebra_functions_m1,algebra,functions,A,0.0,0.95,B,0.95,B,0.95,B,1.0,A
Qwen2.5-7B,algebra_functions_m2,algebra,functions,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,algebra_functions_m3,algebra,functions,A,0.0,0.95,B,0.9,B,0.95,B,0.95,A
Qwen2.5-7B,algebra_functions_h1,algebra,functions,A,0.0,0.9,B,0.85,B,0.9,,,A
Qwen2.5-7B,algebra_functions_h2,algebra,functions,B,1.0,0.95,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B,algebra_functions_h3,algebra,functions,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,algebra_systems_e1,algebra,systems of equations,A,1.0,0.9,A,0.85,A,0.95,B,0.95,B
Qwen2.5-7B,algebra_systems_e2,algebra,systems of equations,A,0.0,0.8,B,0.95,B,0.9,B,1.0,B
Qwen2.5-7B,algebra_systems_e3,algebra,systems of equations,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,algebra_systems_m1,algebra,systems of equations,A,1.0,0.9,A,0.95,B,0.7,A,1.0,A
Qwen2.5-7B,algebra_systems_m2,algebra,systems of equations,A,1.0,0.9,A,0.6,B,0.95,A,0.95,B
Qwen2.5-7B,algebra_systems_m3,algebra,systems of equations,A,0.0,0.8,B,0.95,B,0.95,B,1.0,A
Qwen2.5-7B,algebra_systems_h1,algebra,systems of equations,A,0.0,1.0,B,0.85,B,0.95,B,0.95,A
Qwen2.5-7B,algebra_systems_h2,algebra,systems of equations,A,0.0,1.0,B,0.95,B,0.98,B,1.0,B
Qwen2.5-7B,algebra_systems_h3,algebra,systems of equations,A,1.0,1.0,A,1.0,A,1.0,A,1.0,A
Qwen2.5-7B,calculus_differentiation_e1,calculus,differentiation,A,1.0,0.85,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,calculus_differentiation_e2,calculus,differentiation,A,1.0,0.95,A,0.9,A,0.98,A,0.95,B
Qwen2.5-7B,calculus_differentiation_e3,calculus,differentiation,A,1.0,0.95,A,0.85,A,0.95,B,0.95,A
Qwen2.5-7B,calculus_differentiation_m1,calculus,differentiation,A,1.0,0.9,A,0.51,A,0.95,A,0.95,B
Qwen2.5-7B,calculus_differentiation_m2,calculus,differentiation,A,1.0,0.9,A,0.85,A,1.0,A,0.95,A
Qwen2.5-7B,calculus_differentiation_m3,calculus,differentiation,A,1.0,0.95,A,1.0,A,1.0,A,1.0,B
Qwen2.5-7B,calculus_differentiation_h1,calculus,differentiation,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B,calculus_differentiation_h2,calculus,differentiation,A,1.0,0.8,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,calculus_differentiation_h3,calculus,differentiation,A,0.0,0.9,B,0.85,A,0.95,B,0.95,B
Qwen2.5-7B,calculus_integration_e1,calculus,integration,A,1.0,0.9,A,1.0,A,1.0,A,1.0,A
Qwen2.5-7B,calculus_integration_e2,calculus,integration,A,0.0,0.9,B,0.85,B,0.95,B,1.0,B
Qwen2.5-7B,calculus_integration_e3,calculus,integration,A,1.0,0.95,A,0.85,A,0.95,B,0.95,B
Qwen2.5-7B,calculus_integration_m1,calculus,integration,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,calculus_integration_m2,calculus,integration,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,calculus_integration_m3,calculus,integration,A,0.0,0.9,B,0.95,B,0.98,B,0.95,A
Qwen2.5-7B,calculus_integration_h1,calculus,integration,A,1.0,0.95,A,1.0,A,0.99,A,1.0,A
Qwen2.5-7B,calculus_integration_h2,calculus,integration,A,0.0,0.85,B,1.0,B,0.98,B,1.0,A
Qwen2.5-7B,calculus_integration_h3,calculus,integration,B,1.0,0.95,B,0.85,B,0.9,B,0.8,A
Qwen2.5-7B,calculus_limits_e1,calculus,limits,A,1.0,0.8,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,calculus_limits_e2,calculus,limits,A,0.0,0.95,B,0.92,B,0.95,B,0.95,A
Qwen2.5-7B,calculus_limits_e3,calculus,limits,A,0.0,1.0,B,0.85,A,0.95,B,0.95,B
Qwen2.5-7B,calculus_limits_m1,calculus,limits,A,0.0,0.9,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B,calculus_limits_m2,calculus,limits,B,1.0,0.9,B,0.75,A,0.95,B,0.9,A
Qwen2.5-7B,calculus_limits_m3,calculus,limits,B,1.0,0.95,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B,calculus_limits_h1,calculus,limits,A,0.0,0.95,A,0.6,B,0.95,B,0.95,A
Qwen2.5-7B,calculus_limits_h2,calculus,limits,A,0.0,0.85,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B,calculus_limits_h3,calculus,limits,A,1.0,0.9,A,0.9,A,0.95,A,0.95,B
Qwen2.5-7B,calculus_series_e1,calculus,series,A,0.0,0.9,B,0.75,B,0.95,B,0.95,B
Qwen2.5-7B,calculus_series_e2,calculus,series,A,0.0,0.95,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B,calculus_series_e3,calculus,series,A,0.0,0.9,B,0.85,A,0.95,B,0.9,A
Qwen2.5-7B,calculus_series_m1,calculus,series,A,0.0,0.9,A,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,calculus_series_m2,calculus,series,A,1.0,0.95,A,1.0,A,1.0,A,1.0,B
Qwen2.5-7B,calculus_series_m3,calculus,series,A,0.0,0.75,B,0.9,B,0.98,B,0.95,B
Qwen2.5-7B,calculus_series_h1,calculus,series,A,1.0,1.0,A,1.0,A,1.0,A,1.0,A
Qwen2.5-7B,calculus_series_h2,calculus,series,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,calculus_series_h3,calculus,series,A,1.0,1.0,A,0.95,A,0.98,A,1.0,A
Qwen2.5-7B,calculus_applications_e1,calculus,applications,A,0.0,0.9,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B,calculus_applications_e2,calculus,applications,A,1.0,1.0,A,0.75,A,0.95,A,0.95,B
Qwen2.5-7B,calculus_applications_e3,calculus,applications,A,1.0,0.9,A,0.9,A,0.95,A,0.95,B
Qwen2.5-7B,calculus_applications_m1,calculus,applications,A,0.0,0.85,B,0.85,B,0.98,B,0.95,B
Qwen2.5-7B,calculus_applications_m2,calculus,applications,A,0.0,0.95,A,0.75,B,0.95,B,0.9,B
Qwen2.5-7B,calculus_applications_m3,calculus,applications,A,0.0,0.85,B,0.85,A,0.95,B,0.95,A
Qwen2.5-7B,calculus_applications_h1,calculus,applications,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,calculus_applications_h2,calculus,applications,A,0.0,0.9,B,0.95,A,0.95,B,0.9,A
Qwen2.5-7B,calculus_applications_h3,calculus,applications,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,geometry_plane_e1,geometry,plane geometry,A,0.0,0.95,B,0.98,B,0.95,B,0.95,B
Qwen2.5-7B,geometry_plane_e2,geometry,plane geometry,A,1.0,0.9,A,1.0,A,0.95,A,1.0,B
Qwen2.5-7B,geometry_plane_e3,geometry,plane geometry,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B,geometry_plane_m1,geometry,plane geometry,A,0.0,0.9,A,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,geometry_plane_m2,geometry,plane geometry,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,geometry_plane_m3,geometry,plane geometry,A,0.0,0.9,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,geometry_plane_h1,geometry,plane geometry,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,geometry_plane_h2,geometry,plane geometry,A,1.0,1.0,A,0.98,A,0.95,A,0.95,A
Qwen2.5-7B,geometry_plane_h3,geometry,plane geometry,A,1.0,1.0,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,geometry_coordinate_e1,geometry,coordinate geometry,A,0.0,1.0,B,0.65,B,0.95,B,0.95,B
Qwen2.5-7B,geometry_coordinate_e2,geometry,coordinate geometry,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,geometry_coordinate_e3,geometry,coordinate geometry,A,0.0,0.9,B,0.95,B,0.98,B,0.95,A
Qwen2.5-7B,geometry_coordinate_m1,geometry,coordinate geometry,A,0.0,0.9,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,geometry_coordinate_m2,geometry,coordinate geometry,A,0.0,0.9,B,0.95,B,0.98,B,1.0,B
Qwen2.5-7B,geometry_coordinate_m3,geometry,coordinate geometry,A,1.0,0.9,A,0.85,B,0.95,A,0.95,B
Qwen2.5-7B,geometry_coordinate_h1,geometry,coordinate geometry,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,geometry_coordinate_h2,geometry,coordinate geometry,A,1.0,1.0,B,0.9,A,0.95,A,0.95,A
Qwen2.5-7B,geometry_coordinate_h3,geometry,coordinate geometry,A,0.0,0.95,B,0.85,B,0.95,B,0.95,A
Qwen2.5-7B,geometry_transformations_e1,geometry,transformations,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,geometry_transformations_e2,geometry,transformations,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,geometry_transformations_e3,geometry,transformations,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,geometry_transformations_m1,geometry,transformations,A,1.0,0.9,A,0.85,A,0.95,B,0.85,A
Qwen2.5-7B,geometry_transformations_m2,geometry,transformations,A,1.0,0.85,A,1.0,A,0.95,A,1.0,A
Qwen2.5-7B,geometry_transformations_m3,geometry,transformations,A,1.0,0.85,A,0.6,A,0.95,A,0.95,A
Qwen2.5-7B,geometry_transformations_h1,geometry,transformations,A,1.0,0.9,A,0.75,A,0.95,B,0.95,B
Qwen2.5-7B,geometry_transformations_h2,geometry,transformations,A,1.0,1.0,B,0.95,A,0.95,,,B
Qwen2.5-7B,geometry_transformations_h3,geometry,transformations,A,0.0,0.9,B,1.0,B,0.95,B,1.0,B
Qwen2.5-7B,geometry_mensuration_e1,geometry,mensuration,A,1.0,0.9,A,0.95,A,0.95,A,1.0,A
Qwen2.5-7B,geometry_mensuration_e2,geometry,mensuration,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B,geometry_mensuration_e3,geometry,mensuration,A,1.0,0.95,B,0.85,A,1.0,A,0.95,A
Qwen2.5-7B,geometry_mensuration_m1,geometry,mensuration,A,0.0,0.9,B,1.0,B,0.99,B,1.0,A
Qwen2.5-7B,geometry_mensuration_m2,geometry,mensuration,A,1.0,0.9,A,0.95,A,0.95,A,1.0,B
Qwen2.5-7B,geometry_mensuration_m3,geometry,mensuration,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,geometry_mensuration_h1,geometry,mensuration,B,1.0,0.95,B,0.95,B,0.98,B,1.0,A
Qwen2.5-7B,geometry_mensuration_h2,geometry,mensuration,A,0.0,0.9,B,0.85,B,0.95,,,B
Qwen2.5-7B,geometry_mensuration_h3,geometry,mensuration,B,1.0,0.95,B,0.6,B,0.5,,,B
Qwen2.5-7B,geometry_trigonometry_e1,geometry,trigonometry,A,0.0,0.9,B,0.75,B,0.95,B,0.95,B
Qwen2.5-7B,geometry_trigonometry_e2,geometry,trigonometry,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,geometry_trigonometry_e3,geometry,trigonometry,A,1.0,1.0,A,0.8,A,0.95,B,0.95,A
Qwen2.5-7B,geometry_trigonometry_m1,geometry,trigonometry,B,1.0,0.95,B,0.95,B,0.98,B,0.95,B
Qwen2.5-7B,geometry_trigonometry_m2,geometry,trigonometry,A,1.0,0.85,A,0.85,A,0.95,A,0.9,B
Qwen2.5-7B,geometry_trigonometry_m3,geometry,trigonometry,A,1.0,0.9,A,0.6,A,0.95,B,0.95,A
Qwen2.5-7B,geometry_trigonometry_h1,geometry,trigonometry,B,1.0,0.95,B,0.95,B,0.9,B,1.0,A
Qwen2.5-7B,geometry_trigonometry_h2,geometry,trigonometry,A,1.0,0.85,B,0.6,A,0.65,,,A
Qwen2.5-7B,geometry_trigonometry_h3,geometry,trigonometry,B,1.0,0.85,B,0.95,B,0.95,B,0.8,A
Qwen2.5-7B,numbertheory_divisibility_e1,number theory,divisibility,A,1.0,0.9,A,1.0,A,0.95,A,1.0,A
Qwen2.5-7B,numbertheory_divisibility_e2,number theory,divisibility,A,0.0,0.85,B,1.0,B,0.98,B,0.95,A
Qwen2.5-7B,numbertheory_divisibility_e3,number theory,divisibility,A,1.0,0.9,A,0.95,A,0.95,B,0.95,A
Qwen2.5-7B,numbertheory_divisibility_m1,number theory,divisibility,A,0.0,0.85,B,0.95,B,0.95,A,0.95,B
Qwen2.5-7B,numbertheory_divisibility_m2,number theory,divisibility,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,numbertheory_divisibility_m3,number theory,divisibility,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
Qwen2.5-7B,numbertheory_divisibility_h1,number theory,divisibility,A,0.0,1.0,B,0.55,A,0.95,B,0.95,B
Qwen2.5-7B,numbertheory_divisibility_h2,number theory,divisibility,A,0.0,0.95,B,0.95,A,0.95,B,1.0,A
Qwen2.5-7B,numbertheory_divisibility_h3,number theory,divisibility,A,1.0,0.9,A,0.9,B,0.95,A,0.95,A
Qwen2.5-7B,numbertheory_modular_e1,number theory,modular arithmetic,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
Qwen2.5-7B,numbertheory_modular_e2,number theory,modular arithmetic,A,0.0,0.8,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,numbertheory_modular_e3,number theory,modular arithmetic,A,1.0,0.85,A,0.95,A,0.95,B,0.95,A
Qwen2.5-7B,numbertheory_modular_m1,number theory,modular arithmetic,A,1.0,0.9,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B,numbertheory_modular_m2,number theory,modular arithmetic,A,1.0,1.0,B,0.55,A,0.95,A,0.95,A
Qwen2.5-7B,numbertheory_modular_m3,number theory,modular arithmetic,A,0.0,0.85,B,0.95,B,0.95,B,1.0,A
Qwen2.5-7B,numbertheory_modular_h1,number theory,modular arithmetic,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,numbertheory_modular_h2,number theory,modular arithmetic,A,0.0,0.85,B,0.8,B,0.85,B,0.8,B
Qwen2.5-7B,numbertheory_modular_h3,number theory,modular arithmetic,A,1.0,1.0,A,1.0,A,1.0,A,1.0,B
Qwen2.5-7B,numbertheory_primes_e1,number theory,primes,A,1.0,0.9,A,0.85,B,0.95,A,0.95,A
Qwen2.5-7B,numbertheory_primes_e2,number theory,primes,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,numbertheory_primes_e3,number theory,primes,B,0.0,0.9,A,0.95,B,0.95,A,0.95,A
Qwen2.5-7B,numbertheory_primes_m1,number theory,primes,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
Qwen2.5-7B,numbertheory_primes_m2,number theory,primes,B,0.0,1.0,A,0.95,B,0.95,A,0.95,A
Qwen2.5-7B,numbertheory_primes_m3,number theory,primes,A,0.0,0.8,B,0.9,B,0.95,B,0.95,A
Qwen2.5-7B,numbertheory_primes_h1,number theory,primes,A,1.0,0.95,A,0.75,A,0.95,B,0.95,B
Qwen2.5-7B,numbertheory_primes_h2,number theory,primes,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,numbertheory_primes_h3,number theory,primes,B,0.0,0.95,A,1.0,A,0.95,A,1.0,A
Qwen2.5-7B,numbertheory_diophantine_e1,number theory,diophantine equations,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,numbertheory_diophantine_e2,number theory,diophantine equations,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,numbertheory_diophantine_e3,number theory,diophantine equations,A,1.0,0.9,A,0.75,A,0.95,A,0.95,B
Qwen2.5-7B,numbertheory_diophantine_m1,number theory,diophantine equations,A,1.0,0.9,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,numbertheory_diophantine_m2,number theory,diophantine equations,B,1.0,0.9,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B,numbertheory_diophantine_m3,number theory,diophantine equations,A,1.0,0.85,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,numbertheory_diophantine_h1,number theory,diophantine equations,A,0.0,0.9,B,0.9,B,0.95,B,0.95,B
Qwen2.5-7B,numbertheory_diophantine_h2,number theory,diophantine equations,A,0.0,0.9,B,0.85,A,0.95,B,0.9,A
Qwen2.5-7B,numbertheory_diophantine_h3,number theory,diophantine equations,A,0.0,0.95,B,0.75,B,0.95,B,0.9,B
Qwen2.5-7B,numbertheory_sequences_e1,number theory,number sequences,A,1.0,1.0,A,0.95,A,0.95,A,1.0,A
Qwen2.5-7B,numbertheory_sequences_e2,number theory,number sequences,A,0.0,1.0,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B,numbertheory_sequences_e3,number theory,number sequences,A,1.0,0.95,A,1.0,A,0.98,A,1.0,A
Qwen2.5-7B,numbertheory_sequences_m1,number theory,number sequences,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B,numbertheory_sequences_m2,number theory,number sequences,B,1.0,0.95,B,0.95,B,0.98,B,1.0,B
Qwen2.5-7B,numbertheory_sequences_m3,number theory,number sequences,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Qwen2.5-7B,numbertheory_sequences_h1,number theory,number sequences,A,1.0,0.95,A,0.85,A,0.7,B,0.9,B
Qwen2.5-7B,numbertheory_sequences_h2,number theory,number sequences,A,1.0,0.95,A,0.75,A,0.95,A,1.0,B
Qwen2.5-7B,numbertheory_sequences_h3,number theory,number sequences,A,0.0,0.85,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,combinatorics_counting_e1,combinatorics,counting principles,B,1.0,1.0,B,0.85,B,0.95,B,0.95,A
Qwen2.5-7B,combinatorics_counting_e2,combinatorics,counting principles,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,combinatorics_counting_e3,combinatorics,counting principles,A,0.0,0.9,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,combinatorics_counting_m1,combinatorics,counting principles,A,1.0,0.95,A,1.0,A,1.0,A,1.0,B
Qwen2.5-7B,combinatorics_counting_m2,combinatorics,counting principles,A,0.0,1.0,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B,combinatorics_counting_m3,combinatorics,counting principles,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,combinatorics_counting_h1,combinatorics,counting principles,A,0.0,0.95,B,0.9,B,0.95,A,0.95,B
Qwen2.5-7B,combinatorics_counting_h2,combinatorics,counting principles,A,0.0,0.85,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B,combinatorics_counting_h3,combinatorics,counting principles,A,1.0,0.95,A,0.75,A,0.85,A,0.9,B
Qwen2.5-7B,combinatorics_permutations_e1,combinatorics,permutations,A,1.0,0.8,A,0.95,B,0.95,A,0.95,B
Qwen2.5-7B,combinatorics_permutations_e2,combinatorics,permutations,A,1.0,0.9,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B,combinatorics_permutations_e3,combinatorics,permutations,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B,combinatorics_permutations_m1,combinatorics,permutations,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B,combinatorics_permutations_m2,combinatorics,permutations,A,1.0,0.8,A,0.95,A,0.95,A,1.0,A
Qwen2.5-7B,combinatorics_permutations_m3,combinatorics,permutations,A,1.0,1.0,A,0.95,A,0.95,A,1.0,A
Qwen2.5-7B,combinatorics_permutations_h1,combinatorics,permutations,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,combinatorics_permutations_h2,combinatorics,permutations,B,1.0,0.95,B,1.0,B,1.0,B,1.0,A
Qwen2.5-7B,combinatorics_permutations_h3,combinatorics,permutations,A,1.0,0.9,A,0.6,A,0.85,A,0.7,A
Qwen2.5-7B,combinatorics_combinations_e1,combinatorics,combinations,A,1.0,0.95,A,0.8,A,0.95,A,1.0,A
Qwen2.5-7B,combinatorics_combinations_e2,combinatorics,combinations,A,0.0,0.9,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B,combinatorics_combinations_e3,combinatorics,combinations,A,0.0,0.85,B,1.0,B,1.0,B,1.0,B
Qwen2.5-7B,combinatorics_combinations_m1,combinatorics,combinations,A,1.0,1.0,A,1.0,A,1.0,A,1.0,B
Qwen2.5-7B,combinatorics_combinations_m2,combinatorics,combinations,A,0.0,0.8,B,0.85,A,0.95,B,0.95,B
Qwen2.5-7B,combinatorics_combinations_m3,combinatorics,combinations,B,1.0,0.9,B,0.55,A,0.95,B,0.95,B
Qwen2.5-7B,combinatorics_combinations_h1,combinatorics,combinations,A,0.0,0.9,B,0.9,B,0.95,B,0.95,A
Qwen2.5-7B,combinatorics_combinations_h2,combinatorics,combinations,B,1.0,0.95,B,1.0,B,1.0,B,1.0,A
Qwen2.5-7B,combinatorics_combinations_h3,combinatorics,combinations,A,1.0,0.9,A,0.85,A,0.95,B,0.95,B
Qwen2.5-7B,combinatorics_probability_e1,combinatorics,probability,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,combinatorics_probability_e2,combinatorics,probability,A,1.0,1.0,A,0.85,A,0.95,B,0.95,A
Qwen2.5-7B,combinatorics_probability_e3,combinatorics,probability,A,1.0,0.85,A,0.95,B,0.95,A,0.95,B
Qwen2.5-7B,combinatorics_probability_m1,combinatorics,probability,A,0.0,0.95,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B,combinatorics_probability_m2,combinatorics,probability,A,1.0,0.9,A,1.0,A,0.95,A,1.0,A
Qwen2.5-7B,combinatorics_probability_m3,combinatorics,probability,A,1.0,0.95,A,0.6,A,0.95,A,0.95,B
Qwen2.5-7B,combinatorics_probability_h1,combinatorics,probability,B,1.0,1.0,B,0.85,A,0.98,B,0.95,A
Qwen2.5-7B,combinatorics_probability_h2,combinatorics,probability,B,1.0,0.8,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B,combinatorics_probability_h3,combinatorics,probability,A,1.0,0.9,A,0.9,A,0.95,A,0.95,B
Qwen2.5-7B,combinatorics_recursion_e1,combinatorics,recursion,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,combinatorics_recursion_e2,combinatorics,recursion,A,1.0,0.9,A,1.0,A,0.98,A,1.0,A
Qwen2.5-7B,combinatorics_recursion_e3,combinatorics,recursion,B,1.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,combinatorics_recursion_m1,combinatorics,recursion,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,combinatorics_recursion_m2,combinatorics,recursion,A,0.0,0.9,B,0.95,B,0.95,B,1.0,A
Qwen2.5-7B,combinatorics_recursion_m3,combinatorics,recursion,A,0.0,1.0,B,0.9,A,0.95,B,1.0,B
Qwen2.5-7B,combinatorics_recursion_h1,combinatorics,recursion,A,1.0,0.95,B,0.85,A,0.95,A,1.0,B
Qwen2.5-7B,combinatorics_recursion_h2,combinatorics,recursion,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Qwen2.5-7B,combinatorics_recursion_h3,combinatorics,recursion,A,0.0,0.95,B,0.95,A,0.95,B,1.0,A
Qwen2.5-7B,statistics_descriptive_e1,statistics,descriptive statistics,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B,statistics_descriptive_e2,statistics,descriptive statistics,A,1.0,0.85,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,statistics_descriptive_e3,statistics,descriptive statistics,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,statistics_descriptive_m1,statistics,descriptive statistics,B,1.0,0.8,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,statistics_descriptive_m2,statistics,descriptive statistics,A,0.0,0.95,A,0.85,B,0.95,B,0.9,B
Qwen2.5-7B,statistics_descriptive_m3,statistics,descriptive statistics,A,0.0,0.9,A,0.85,B,0.85,B,0.95,A
Qwen2.5-7B,statistics_descriptive_h1,statistics,descriptive statistics,A,1.0,0.9,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,statistics_descriptive_h2,statistics,descriptive statistics,B,0.0,0.85,B,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,statistics_descriptive_h3,statistics,descriptive statistics,A,1.0,0.95,A,0.5,A,0.95,A,0.95,A
Qwen2.5-7B,statistics_distributions_e1,statistics,distributions,A,1.0,0.9,B,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,statistics_distributions_e2,statistics,distributions,A,1.0,0.9,A,0.95,A,0.95,A,1.0,B
Qwen2.5-7B,statistics_distributions_e3,statistics,distributions,A,1.0,0.95,A,0.85,A,0.95,B,0.95,B
Qwen2.5-7B,statistics_distributions_m1,statistics,distributions,A,1.0,1.0,A,1.0,A,1.0,A,0.9,A
Qwen2.5-7B,statistics_distributions_m2,statistics,distributions,A,1.0,0.8,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,statistics_distributions_m3,statistics,distributions,A,1.0,0.85,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B,statistics_distributions_h1,statistics,distributions,A,0.0,0.95,B,0.85,B,0.98,B,0.9,A
Qwen2.5-7B,statistics_distributions_h2,statistics,distributions,A,0.0,0.95,B,0.85,B,0.98,B,1.0,A
Qwen2.5-7B,statistics_distributions_h3,statistics,distributions,A,1.0,0.9,A,1.0,A,0.99,A,1.0,A
Qwen2.5-7B,statistics_hypothesis_e1,statistics,hypothesis testing,A,0.0,0.8,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,statistics_hypothesis_e2,statistics,hypothesis testing,B,1.0,0.85,A,0.65,B,0.95,B,0.9,B
Qwen2.5-7B,statistics_hypothesis_e3,statistics,hypothesis testing,A,0.0,0.9,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,statistics_hypothesis_m1,statistics,hypothesis testing,A,1.0,0.9,A,0.95,A,0.95,B,0.95,A
Qwen2.5-7B,statistics_hypothesis_m2,statistics,hypothesis testing,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Qwen2.5-7B,statistics_hypothesis_m3,statistics,hypothesis testing,A,0.0,0.6,B,0.9,B,0.75,A,0.7,A
Qwen2.5-7B,statistics_hypothesis_h1,statistics,hypothesis testing,A,0.0,0.95,B,0.9,A,0.95,B,0.9,A
Qwen2.5-7B,statistics_hypothesis_h2,statistics,hypothesis testing,A,1.0,1.0,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,statistics_hypothesis_h3,statistics,hypothesis testing,A,1.0,1.0,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,statistics_regression_e1,statistics,regression,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B,statistics_regression_e2,statistics,regression,B,1.0,0.8,B,0.9,B,0.95,B,0.95,A
Qwen2.5-7B,statistics_regression_e3,statistics,regression,A,0.0,1.0,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B,statistics_regression_m1,statistics,regression,A,0.0,0.9,B,1.0,B,1.0,B,1.0,B
Qwen2.5-7B,statistics_regression_m2,statistics,regression,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,statistics_regression_m3,statistics,regression,A,0.0,0.9,B,0.9,A,0.95,B,0.95,B
Qwen2.5-7B,statistics_regression_h1,statistics,regression,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
Qwen2.5-7B,statistics_regression_h2,statistics,regression,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B,statistics_regression_h3,statistics,regression,A,0.0,0.8,B,0.85,A,0.95,B,0.95,A
Qwen2.5-7B,statistics_bayesian_e1,statistics,bayesian inference,A,0.0,0.95,B,1.0,B,0.98,B,1.0,B
Qwen2.5-7B,statistics_bayesian_e2,statistics,bayesian inference,A,0.0,0.85,B,0.9,B,0.9,B,0.95,B
Qwen2.5-7B,statistics_bayesian_e3,statistics,bayesian inference,A,1.0,0.95,A,0.85,A,0.98,A,0.95,B
Qwen2.5-7B,statistics_bayesian_m1,statistics,bayesian inference,A,1.0,1.0,B,0.6,A,0.95,A,0.95,A
Qwen2.5-7B,statistics_bayesian_m2,statistics,bayesian inference,A,0.0,0.95,A,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,statistics_bayesian_m3,statistics,bayesian inference,A,1.0,1.0,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,statistics_bayesian_h1,statistics,bayesian inference,A,0.0,1.0,B,0.85,B,0.95,,,A
Qwen2.5-7B,statistics_bayesian_h2,statistics,bayesian inference,A,0.0,0.5,B,0.85,A,0.9,B,0.95,A
Qwen2.5-7B,statistics_bayesian_h3,statistics,bayesian inference,A,0.0,1.0,B,1.0,B,0.99,B,1.0,B
Qwen2.5-7B,linearalgebra_matrices_e1,linear algebra,matrices,A,1.0,0.9,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,linearalgebra_matrices_e2,linear algebra,matrices,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,linearalgebra_matrices_e3,linear algebra,matrices,A,0.0,0.95,B,1.0,B,0.95,B,1.0,A
Qwen2.5-7B,linearalgebra_matrices_m1,linear algebra,matrices,A,0.0,0.9,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,linearalgebra_matrices_m2,linear algebra,matrices,A,0.0,0.9,B,0.95,A,0.95,B,0.95,B
Qwen2.5-7B,linearalgebra_matrices_m3,linear algebra,matrices,A,0.0,0.85,B,0.95,B,0.95,B,0.8,B
Qwen2.5-7B,linearalgebra_matrices_h1,linear algebra,matrices,B,1.0,0.95,B,0.75,B,0.95,B,1.0,A
Qwen2.5-7B,linearalgebra_matrices_h2,linear algebra,matrices,A,0.0,0.9,B,1.0,B,0.98,B,1.0,A
Qwen2.5-7B,linearalgebra_matrices_h3,linear algebra,matrices,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,linearalgebra_determinants_e1,linear algebra,determinants,A,0.0,0.85,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B,linearalgebra_determinants_e2,linear algebra,determinants,A,0.0,0.95,B,0.95,A,0.95,B,1.0,A
Qwen2.5-7B,linearalgebra_determinants_e3,linear algebra,determinants,A,1.0,0.9,A,0.9,A,0.95,A,0.95,B
Qwen2.5-7B,linearalgebra_determinants_m1,linear algebra,determinants,B,1.0,0.95,B,0.95,B,0.98,B,1.0,A
Qwen2.5-7B,linearalgebra_determinants_m2,linear algebra,determinants,A,1.0,1.0,A,0.95,A,0.95,A,0.9,A
Qwen2.5-7B,linearalgebra_determinants_m3,linear algebra,determinants,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
Qwen2.5-7B,linearalgebra_determinants_h1,linear algebra,determinants,A,0.0,0.9,B,0.75,B,0.9,,,B
Qwen2.5-7B,linearalgebra_determinants_h2,linear algebra,determinants,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,linearalgebra_determinants_h3,linear algebra,determinants,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B,linearalgebra_vectorspaces_e1,linear algebra,vector spaces,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B,linearalgebra_vectorspaces_e2,linear algebra,vector spaces,B,1.0,0.85,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,linearalgebra_vectorspaces_e3,linear algebra,vector spaces,A,1.0,1.0,B,0.85,A,0.95,A,0.95,B
Qwen2.5-7B,linearalgebra_vectorspaces_m1,linear algebra,vector spaces,A,0.0,0.95,B,0.75,B,0.75,,,B
Qwen2.5-7B,linearalgebra_vectorspaces_m2,linear algebra,vector spaces,A,1.0,0.85,A,1.0,A,0.95,A,1.0,A
Qwen2.5-7B,linearalgebra_vectorspaces_m3,linear algebra,vector spaces,A,1.0,1.0,A,1.0,A,0.95,A,1.0,B
Qwen2.5-7B,linearalgebra_vectorspaces_h1,linear algebra,vector spaces,A,1.0,0.95,A,0.98,A,0.98,A,1.0,A
Qwen2.5-7B,linearalgebra_vectorspaces_h2,linear algebra,vector spaces,A,1.0,1.0,A,0.55,A,0.95,A,0.95,A
Qwen2.5-7B,linearalgebra_vectorspaces_h3,linear algebra,vector spaces,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Qwen2.5-7B,linearalgebra_eigenvalues_e1,linear algebra,eigenvalues,A,1.0,0.95,A,0.95,B,0.95,A,0.95,B
Qwen2.5-7B,linearalgebra_eigenvalues_e2,linear algebra,eigenvalues,A,1.0,0.9,A,0.95,A,0.98,A,0.95,A
Qwen2.5-7B,linearalgebra_eigenvalues_e3,linear algebra,eigenvalues,A,0.0,1.0,B,0.95,A,0.95,B,1.0,A
Qwen2.5-7B,linearalgebra_eigenvalues_m1,linear algebra,eigenvalues,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B,linearalgebra_eigenvalues_m2,linear algebra,eigenvalues,A,0.0,0.8,B,0.85,B,0.85,A,0.95,A
Qwen2.5-7B,linearalgebra_eigenvalues_m3,linear algebra,eigenvalues,A,0.0,0.85,B,0.95,A,0.95,B,0.95,B
Qwen2.5-7B,linearalgebra_eigenvalues_h1,linear algebra,eigenvalues,A,1.0,1.0,A,0.85,A,0.9,,,A
Qwen2.5-7B,linearalgebra_eigenvalues_h2,linear algebra,eigenvalues,A,1.0,0.95,A,0.75,A,0.95,A,0.95,A
Qwen2.5-7B,linearalgebra_eigenvalues_h3,linear algebra,eigenvalues,A,0.0,0.9,A,0.95,B,0.95,B,0.95,A
Qwen2.5-7B,linearalgebra_transformations_e1,linear algebra,linear transformations,A,1.0,0.9,A,0.95,A,0.95,B,0.9,A
Qwen2.5-7B,linearalgebra_transformations_e2,linear algebra,linear transformations,A,0.0,0.95,A,0.85,B,0.95,B,0.95,B
Qwen2.5-7B,linearalgebra_transformations_e3,linear algebra,linear transformations,A,0.0,0.85,B,0.95,B,0.98,B,0.95,A
Qwen2.5-7B,linearalgebra_transformations_m1,linear algebra,linear transformations,A,1.0,0.95,B,0.95,A,0.95,A,0.95,B
Qwen2.5-7B,linearalgebra_transformations_m2,linear algebra,linear transformations,A,0.0,0.9,B,0.85,A,0.95,B,0.95,A
Qwen2.5-7B,linearalgebra_transformations_m3,linear algebra,linear transformations,A,1.0,1.0,A,0.55,A,0.95,A,0.95,A
Qwen2.5-7B,linearalgebra_transformations_h1,linear algebra,linear transformations,A,0.0,1.0,A,0.75,B,0.95,,,B
Qwen2.5-7B,linearalgebra_transformations_h2,linear algebra,linear transformations,A,1.0,0.85,A,1.0,A,0.95,A,1.0,B
Qwen2.5-7B,linearalgebra_transformations_h3,linear algebra,linear transformations,B,1.0,0.95,B,0.9,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_basic_operations_e1,arithmetic,basic operations,A,1.0,0.85,B,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,arithmetic_basic_operations_e2,arithmetic,basic operations,A,0.0,0.85,B,0.85,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,arithmetic_basic_operations_e3,arithmetic,basic operations,A,0.0,0.85,B,0.85,A,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_basic_operations_m1,arithmetic,basic operations,A,0.0,0.9,A,0.95,B,0.95,B,0.95,A
Qwen2.5-7B-Instruct,arithmetic_basic_operations_m2,arithmetic,basic operations,B,1.0,0.85,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_basic_operations_m3,arithmetic,basic operations,B,0.0,0.85,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,arithmetic_basic_operations_h1,arithmetic,basic operations,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_basic_operations_h2,arithmetic,basic operations,A,1.0,0.9,A,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,arithmetic_basic_operations_h3,arithmetic,basic operations,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_fractions_e1,arithmetic,fractions,A,1.0,0.95,A,0.85,A,0.95,B,0.9,A
Qwen2.5-7B-Instruct,arithmetic_fractions_e2,arithmetic,fractions,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_fractions_e3,arithmetic,fractions,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,arithmetic_fractions_m1,arithmetic,fractions,B,1.0,0.95,B,0.9,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_fractions_m2,arithmetic,fractions,B,1.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_fractions_m3,arithmetic,fractions,A,1.0,0.95,B,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,arithmetic_fractions_h1,arithmetic,fractions,A,1.0,0.95,A,1.0,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,arithmetic_fractions_h2,arithmetic,fractions,A,0.0,0.95,B,1.0,B,0.98,B,1.0,A
Qwen2.5-7B-Instruct,arithmetic_fractions_h3,arithmetic,fractions,A,0.0,0.95,A,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_percentages_e1,arithmetic,percentages,B,1.0,0.95,B,0.92,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,arithmetic_percentages_e2,arithmetic,percentages,A,0.0,0.85,B,0.85,A,0.95,B,0.9,A
Qwen2.5-7B-Instruct,arithmetic_percentages_e3,arithmetic,percentages,A,1.0,0.95,A,0.85,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,arithmetic_percentages_m1,arithmetic,percentages,B,1.0,0.85,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_percentages_m2,arithmetic,percentages,A,1.0,0.95,B,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,arithmetic_percentages_m3,arithmetic,percentages,B,1.0,0.9,A,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_percentages_h1,arithmetic,percentages,A,1.0,0.9,A,0.9,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,arithmetic_percentages_h2,arithmetic,percentages,A,0.0,0.95,B,0.95,B,0.9,B,0.95,A
Qwen2.5-7B-Instruct,arithmetic_percentages_h3,arithmetic,percentages,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_numerical_e1,arithmetic,numerical approximation,B,1.0,0.85,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B-Instruct,arithmetic_numerical_e2,arithmetic,numerical approximation,B,1.0,0.85,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B-Instruct,arithmetic_numerical_e3,arithmetic,numerical approximation,A,0.0,0.85,A,0.65,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_numerical_m1,arithmetic,numerical approximation,A,1.0,0.95,A,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,arithmetic_numerical_m2,arithmetic,numerical approximation,B,1.0,0.85,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B-Instruct,arithmetic_numerical_m3,arithmetic,numerical approximation,A,1.0,0.85,A,0.98,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,arithmetic_numerical_h1,arithmetic,numerical approximation,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,arithmetic_numerical_h2,arithmetic,numerical approximation,A,0.0,0.9,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B-Instruct,arithmetic_numerical_h3,arithmetic,numerical approximation,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,arithmetic_order_e1,arithmetic,order of operations,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,arithmetic_order_e2,arithmetic,order of operations,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_order_e3,arithmetic,order of operations,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_order_m1,arithmetic,order of operations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,arithmetic_order_m2,arithmetic,order of operations,A,1.0,0.9,A,0.8,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,arithmetic_order_m3,arithmetic,order of operations,A,0.0,0.95,A,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_order_h1,arithmetic,order of operations,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_order_h2,arithmetic,order of operations,B,1.0,0.9,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,arithmetic_order_h3,arithmetic,order of operations,A,1.0,0.85,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,algebra_equations_e1,algebra,equations,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,algebra_equations_e2,algebra,equations,A,0.0,0.85,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B-Instruct,algebra_equations_e3,algebra,equations,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,algebra_equations_m1,algebra,equations,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,algebra_equations_m2,algebra,equations,A,0.0,0.9,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,algebra_equations_m3,algebra,equations,A,1.0,0.85,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,algebra_equations_h1,algebra,equations,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
Qwen2.5-7B-Instruct,algebra_equations_h2,algebra,equations,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,algebra_equations_h3,algebra,equations,A,0.0,0.85,B,0.98,B,0.98,B,1.0,A
Qwen2.5-7B-Instruct,algebra_inequalities_e1,algebra,inequalities,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,algebra_inequalities_e2,algebra,inequalities,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,algebra_inequalities_e3,algebra,inequalities,A,1.0,0.85,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,algebra_inequalities_m1,algebra,inequalities,B,1.0,0.85,B,0.9,B,0.95,A,0.95,B
Qwen2.5-7B-Instruct,algebra_inequalities_m2,algebra,inequalities,A,0.0,0.9,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,algebra_inequalities_m3,algebra,inequalities,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,algebra_inequalities_h1,algebra,inequalities,A,0.0,0.95,B,0.9,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,algebra_inequalities_h2,algebra,inequalities,A,1.0,0.95,A,1.0,A,0.98,A,1.0,A
Qwen2.5-7B-Instruct,algebra_inequalities_h3,algebra,inequalities,A,0.0,0.85,B,0.9,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,algebra_polynomials_e1,algebra,polynomials,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,algebra_polynomials_e2,algebra,polynomials,B,1.0,0.95,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B-Instruct,algebra_polynomials_e3,algebra,polynomials,A,1.0,0.85,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,algebra_polynomials_m1,algebra,polynomials,A,1.0,0.85,A,0.75,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,algebra_polynomials_m2,algebra,polynomials,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,algebra_polynomials_m3,algebra,polynomials,A,0.0,0.95,B,0.95,B,0.98,A,0.95,A
Qwen2.5-7B-Instruct,algebra_polynomials_h1,algebra,polynomials,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,algebra_polynomials_h2,algebra,polynomials,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,algebra_polynomials_h3,algebra,polynomials,A,0.0,0.6,B,0.75,B,0.9,B,0.7,B
Qwen2.5-7B-Instruct,algebra_functions_e1,algebra,functions,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,algebra_functions_e2,algebra,functions,A,1.0,0.95,A,0.9,A,0.98,B,1.0,B
Qwen2.5-7B-Instruct,algebra_functions_e3,algebra,functions,A,1.0,0.85,A,0.95,A,0.95,A,0.9,A
Qwen2.5-7B-Instruct,algebra_functions_m1,algebra,functions,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,algebra_functions_m2,algebra,functions,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,algebra_functions_m3,algebra,functions,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,algebra_functions_h1,algebra,functions,A,1.0,0.95,A,0.85,A,0.95,A,1.0,A
Qwen2.5-7B-Instruct,algebra_functions_h2,algebra,functions,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,algebra_functions_h3,algebra,functions,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,algebra_systems_e1,algebra,systems of equations,B,1.0,0.85,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,algebra_systems_e2,algebra,systems of equations,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,algebra_systems_e3,algebra,systems of equations,A,1.0,0.95,A,0.9,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,algebra_systems_m1,algebra,systems of equations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,algebra_systems_m2,algebra,systems of equations,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,algebra_systems_m3,algebra,systems of equations,B,1.0,0.95,B,0.85,B,0.95,B,0.95,A
Qwen2.5-7B-Instruct,algebra_systems_h1,algebra,systems of equations,B,1.0,0.9,B,0.97,B,0.95,B,1.0,B
Qwen2.5-7B-Instruct,algebra_systems_h2,algebra,systems of equations,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,algebra_systems_h3,algebra,systems of equations,A,1.0,0.9,A,0.95,A,0.98,A,1.0,B
Qwen2.5-7B-Instruct,calculus_differentiation_e1,calculus,differentiation,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,calculus_differentiation_e2,calculus,differentiation,A,0.0,0.85,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B-Instruct,calculus_differentiation_e3,calculus,differentiation,A,1.0,0.85,A,0.85,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,calculus_differentiation_m1,calculus,differentiation,A,1.0,0.85,A,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,calculus_differentiation_m2,calculus,differentiation,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,calculus_differentiation_m3,calculus,differentiation,A,1.0,0.95,A,0.98,A,0.98,A,1.0,A
Qwen2.5-7B-Instruct,calculus_differentiation_h1,calculus,differentiation,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,calculus_differentiation_h2,calculus,differentiation,A,0.0,0.95,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B-Instruct,calculus_differentiation_h3,calculus,differentiation,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,calculus_integration_e1,calculus,integration,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,calculus_integration_e2,calculus,integration,B,1.0,0.95,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B-Instruct,calculus_integration_e3,calculus,integration,A,1.0,0.85,A,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,calculus_integration_m1,calculus,integration,B,1.0,0.95,B,0.92,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,calculus_integration_m2,calculus,integration,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,calculus_integration_m3,calculus,integration,A,1.0,0.85,A,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,calculus_integration_h1,calculus,integration,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,calculus_integration_h2,calculus,integration,A,1.0,0.95,A,0.9,A,0.98,A,0.95,B
Qwen2.5-7B-Instruct,calculus_integration_h3,calculus,integration,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,calculus_limits_e1,calculus,limits,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,calculus_limits_e2,calculus,limits,A,1.0,0.9,A,0.95,A,0.95,B,1.0,A
Qwen2.5-7B-Instruct,calculus_limits_e3,calculus,limits,A,0.0,0.85,B,0.95,B,0.98,B,0.95,A
Qwen2.5-7B-Instruct,calculus_limits_m1,calculus,limits,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,calculus_limits_m2,calculus,limits,A,1.0,0.95,A,0.8,B,0.95,A,0.95,B
Qwen2.5-7B-Instruct,calculus_limits_m3,calculus,limits,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,calculus_limits_h1,calculus,limits,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,calculus_limits_h2,calculus,limits,A,1.0,0.95,A,0.9,A,0.98,A,0.95,B
Qwen2.5-7B-Instruct,calculus_limits_h3,calculus,limits,A,1.0,0.95,A,0.8,A,0.95,B,0.9,B
Qwen2.5-7B-Instruct,calculus_series_e1,calculus,series,A,1.0,0.95,B,0.95,A,0.95,A,0.9,A
Qwen2.5-7B-Instruct,calculus_series_e2,calculus,series,A,0.0,0.9,B,0.95,A,0.95,B,0.9,A
Qwen2.5-7B-Instruct,calculus_series_e3,calculus,series,A,0.0,0.95,B,0.75,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,calculus_series_m1,calculus,series,A,0.0,0.9,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B-Instruct,calculus_series_m2,calculus,series,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,calculus_series_m3,calculus,series,A,0.0,0.9,B,0.98,B,0.95,B,1.0,B
Qwen2.5-7B-Instruct,calculus_series_h1,calculus,series,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,calculus_series_h2,calculus,series,A,1.0,0.85,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,calculus_series_h3,calculus,series,A,0.0,0.95,B,0.85,B,0.95,B,1.0,B
Qwen2.5-7B-Instruct,calculus_applications_e1,calculus,applications,A,1.0,0.95,A,0.8,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,calculus_applications_e2,calculus,applications,A,1.0,0.85,A,0.9,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,calculus_applications_e3,calculus,applications,A,0.0,0.85,B,0.85,B,0.95,A,0.95,B
Qwen2.5-7B-Instruct,calculus_applications_m1,calculus,applications,A,1.0,0.95,A,0.75,A,0.95,B,0.95,B
Qwen2.5-7B-Instruct,calculus_applications_m2,calculus,applications,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,calculus_applications_m3,calculus,applications,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,calculus_applications_h1,calculus,applications,A,0.0,0.95,B,1.0,B,1.0,B,1.0,B
Qwen2.5-7B-Instruct,calculus_applications_h2,calculus,applications,A,1.0,0.95,A,0.6,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,calculus_applications_h3,calculus,applications,B,1.0,0.95,B,1.0,B,0.98,B,1.0,B
Qwen2.5-7B-Instruct,geometry_plane_e1,geometry,plane geometry,A,1.0,0.85,A,0.95,A,0.95,B,0.85,A
Qwen2.5-7B-Instruct,geometry_plane_e2,geometry,plane geometry,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,geometry_plane_e3,geometry,plane geometry,A,0.0,0.85,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,geometry_plane_m1,geometry,plane geometry,A,0.0,0.85,B,0.95,A,0.95,B,1.0,A
Qwen2.5-7B-Instruct,geometry_plane_m2,geometry,plane geometry,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,geometry_plane_m3,geometry,plane geometry,A,1.0,0.85,B,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,geometry_plane_h1,geometry,plane geometry,B,1.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,geometry_plane_h2,geometry,plane geometry,A,0.0,0.85,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,geometry_plane_h3,geometry,plane geometry,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,geometry_coordinate_e1,geometry,coordinate geometry,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,geometry_coordinate_e2,geometry,coordinate geometry,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,geometry_coordinate_e3,geometry,coordinate geometry,A,0.0,0.9,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B-Instruct,geometry_coordinate_m1,geometry,coordinate geometry,B,1.0,0.85,B,0.98,B,0.95,B,0.95,A
Qwen2.5-7B-Instruct,geometry_coordinate_m2,geometry,coordinate geometry,A,1.0,0.95,B,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,geometry_coordinate_m3,geometry,coordinate geometry,A,0.0,0.9,B,0.95,B,0.95,A,0.95,A
Qwen2.5-7B-Instruct,geometry_coordinate_h1,geometry,coordinate geometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,geometry_coordinate_h2,geometry,coordinate geometry,B,1.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,geometry_coordinate_h3,geometry,coordinate geometry,B,0.0,0.95,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,geometry_transformations_e1,geometry,transformations,A,1.0,0.85,B,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,geometry_transformations_e2,geometry,transformations,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,geometry_transformations_e3,geometry,transformations,A,0.0,0.85,B,0.95,B,0.98,B,0.95,A
Qwen2.5-7B-Instruct,geometry_transformations_m1,geometry,transformations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,geometry_transformations_m2,geometry,transformations,B,0.0,0.85,A,1.0,A,0.9,A,0.9,B
Qwen2.5-7B-Instruct,geometry_transformations_m3,geometry,transformations,A,0.0,0.85,B,0.8,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,geometry_transformations_h1,geometry,transformations,A,0.0,0.95,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B-Instruct,geometry_transformations_h2,geometry,transformations,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
Qwen2.5-7B-Instruct,geometry_transformations_h3,geometry,transformations,B,1.0,0.95,B,0.9,A,0.95,B,0.95,B
Qwen2.5-7B-Instruct,geometry_mensuration_e1,geometry,mensuration,A,0.0,0.95,B,1.0,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,geometry_mensuration_e2,geometry,mensuration,B,1.0,0.85,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,geometry_mensuration_e3,geometry,mensuration,A,0.0,0.95,B,0.9,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,geometry_mensuration_m1,geometry,mensuration,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
Qwen2.5-7B-Instruct,geometry_mensuration_m2,geometry,mensuration,A,1.0,0.85,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,geometry_mensuration_m3,geometry,mensuration,A,0.0,0.95,B,0.9,B,0.95,A,1.0,B
Qwen2.5-7B-Instruct,geometry_mensuration_h1,geometry,mensuration,A,0.0,0.95,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B-Instruct,geometry_mensuration_h2,geometry,mensuration,B,1.0,0.95,B,0.7,B,0.9,,,B
Qwen2.5-7B-Instruct,geometry_mensuration_h3,geometry,mensuration,A,0.0,0.95,B,0.7,B,0.95,A,0.8,B
Qwen2.5-7B-Instruct,geometry_trigonometry_e1,geometry,trigonometry,A,0.0,0.85,B,1.0,B,0.98,B,1.0,B
Qwen2.5-7B-Instruct,geometry_trigonometry_e2,geometry,trigonometry,A,0.0,0.85,B,1.0,B,0.85,B,0.9,A
Qwen2.5-7B-Instruct,geometry_trigonometry_e3,geometry,trigonometry,A,0.0,0.95,B,0.8,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,geometry_trigonometry_m1,geometry,trigonometry,A,0.0,0.9,B,0.95,B,0.95,A,0.95,A
Qwen2.5-7B-Instruct,geometry_trigonometry_m2,geometry,trigonometry,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,geometry_trigonometry_m3,geometry,trigonometry,B,1.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,geometry_trigonometry_h1,geometry,trigonometry,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,geometry_trigonometry_h2,geometry,trigonometry,A,0.0,0.95,B,0.75,B,0.95,,,B
Qwen2.5-7B-Instruct,geometry_trigonometry_h3,geometry,trigonometry,A,1.0,0.85,A,0.85,A,0.85,A,0.95,B
Qwen2.5-7B-Instruct,numbertheory_divisibility_e1,number theory,divisibility,A,0.0,0.85,B,0.95,B,0.95,B,1.0,A
Qwen2.5-7B-Instruct,numbertheory_divisibility_e2,number theory,divisibility,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,numbertheory_divisibility_e3,number theory,divisibility,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,numbertheory_divisibility_m1,number theory,divisibility,B,1.0,0.85,B,0.95,B,0.95,B,1.0,B
Qwen2.5-7B-Instruct,numbertheory_divisibility_m2,number theory,divisibility,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,numbertheory_divisibility_m3,number theory,divisibility,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,numbertheory_divisibility_h1,number theory,divisibility,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,numbertheory_divisibility_h2,number theory,divisibility,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,numbertheory_divisibility_h3,number theory,divisibility,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
Qwen2.5-7B-Instruct,numbertheory_modular_e1,number theory,modular arithmetic,A,1.0,0.85,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,numbertheory_modular_e2,number theory,modular arithmetic,A,1.0,0.85,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,numbertheory_modular_e3,number theory,modular arithmetic,A,0.0,0.95,A,0.95,B,0.95,B,1.0,A
Qwen2.5-7B-Instruct,numbertheory_modular_m1,number theory,modular arithmetic,A,1.0,0.95,A,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,numbertheory_modular_m2,number theory,modular arithmetic,A,1.0,0.95,A,0.9,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,numbertheory_modular_m3,number theory,modular arithmetic,A,0.0,0.95,B,0.85,A,0.98,B,0.95,B
Qwen2.5-7B-Instruct,numbertheory_modular_h1,number theory,modular arithmetic,A,0.0,0.85,B,0.85,A,0.95,B,0.95,B
Qwen2.5-7B-Instruct,numbertheory_modular_h2,number theory,modular arithmetic,A,0.0,0.95,B,0.6,A,0.98,B,0.95,B
Qwen2.5-7B-Instruct,numbertheory_modular_h3,number theory,modular arithmetic,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,numbertheory_primes_e1,number theory,primes,A,0.0,0.85,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,numbertheory_primes_e2,number theory,primes,A,1.0,0.85,A,0.95,A,0.95,A,1.0,A
Qwen2.5-7B-Instruct,numbertheory_primes_e3,number theory,primes,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,numbertheory_primes_m1,number theory,primes,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,numbertheory_primes_m2,number theory,primes,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,numbertheory_primes_m3,number theory,primes,A,1.0,0.85,A,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,numbertheory_primes_h1,number theory,primes,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,numbertheory_primes_h2,number theory,primes,A,0.0,0.85,B,1.0,B,0.99,B,1.0,B
Qwen2.5-7B-Instruct,numbertheory_primes_h3,number theory,primes,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,numbertheory_diophantine_e1,number theory,diophantine equations,A,0.0,0.95,B,0.95,B,0.95,B,1.0,A
Qwen2.5-7B-Instruct,numbertheory_diophantine_e2,number theory,diophantine equations,A,0.0,0.95,B,0.9,B,0.95,A,0.95,B
Qwen2.5-7B-Instruct,numbertheory_diophantine_e3,number theory,diophantine equations,A,1.0,0.95,B,0.75,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,numbertheory_diophantine_m1,number theory,diophantine equations,A,0.0,0.9,B,0.9,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,numbertheory_diophantine_m2,number theory,diophantine equations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,numbertheory_diophantine_m3,number theory,diophantine equations,A,1.0,0.85,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,numbertheory_diophantine_h1,number theory,diophantine equations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B-Instruct,numbertheory_diophantine_h2,number theory,diophantine equations,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,numbertheory_diophantine_h3,number theory,diophantine equations,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,numbertheory_sequences_e1,number theory,number sequences,A,1.0,0.85,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,numbertheory_sequences_e2,number theory,number sequences,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,numbertheory_sequences_e3,number theory,number sequences,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
Qwen2.5-7B-Instruct,numbertheory_sequences_m1,number theory,number sequences,A,0.0,0.95,B,0.8,B,0.98,B,1.0,A
Qwen2.5-7B-Instruct,numbertheory_sequences_m2,number theory,number sequences,A,1.0,0.95,B,0.65,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,numbertheory_sequences_m3,number theory,number sequences,A,1.0,0.95,A,0.95,A,0.95,A,0.9,A
Qwen2.5-7B-Instruct,numbertheory_sequences_h1,number theory,number sequences,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,numbertheory_sequences_h2,number theory,number sequences,A,1.0,0.95,A,0.9,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,numbertheory_sequences_h3,number theory,number sequences,A,0.0,0.85,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,combinatorics_counting_e1,combinatorics,counting principles,B,1.0,0.95,A,0.85,B,0.95,B,0.95,A
Qwen2.5-7B-Instruct,combinatorics_counting_e2,combinatorics,counting principles,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,combinatorics_counting_e3,combinatorics,counting principles,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,combinatorics_counting_m1,combinatorics,counting principles,A,1.0,0.95,A,0.85,B,0.95,A,0.95,B
Qwen2.5-7B-Instruct,combinatorics_counting_m2,combinatorics,counting principles,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,combinatorics_counting_m3,combinatorics,counting principles,B,0.0,0.95,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,combinatorics_counting_h1,combinatorics,counting principles,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,combinatorics_counting_h2,combinatorics,counting principles,A,0.0,0.85,B,0.85,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,combinatorics_counting_h3,combinatorics,counting principles,A,1.0,0.95,A,0.6,A,0.95,A,0.7,B
Qwen2.5-7B-Instruct,combinatorics_permutations_e1,combinatorics,permutations,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,combinatorics_permutations_e2,combinatorics,permutations,A,0.0,0.85,B,0.95,A,0.95,B,1.0,A
Qwen2.5-7B-Instruct,combinatorics_permutations_e3,combinatorics,permutations,A,1.0,0.85,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,combinatorics_permutations_m1,combinatorics,permutations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,combinatorics_permutations_m2,combinatorics,permutations,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,combinatorics_permutations_m3,combinatorics,permutations,A,1.0,0.95,A,0.85,A,0.95,B,1.0,B
Qwen2.5-7B-Instruct,combinatorics_permutations_h1,combinatorics,permutations,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,combinatorics_permutations_h2,combinatorics,permutations,A,1.0,0.95,A,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,combinatorics_permutations_h3,combinatorics,permutations,B,0.0,0.85,A,0.65,B,0.95,A,0.95,B
Qwen2.5-7B-Instruct,combinatorics_combinations_e1,combinatorics,combinations,B,0.0,0.95,A,0.85,B,0.95,A,0.95,B
Qwen2.5-7B-Instruct,combinatorics_combinations_e2,combinatorics,combinations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
Qwen2.5-7B-Instruct,combinatorics_combinations_e3,combinatorics,combinations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,combinatorics_combinations_m1,combinatorics,combinations,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,combinatorics_combinations_m2,combinatorics,combinations,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
Qwen2.5-7B-Instruct,combinatorics_combinations_m3,combinatorics,combinations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,combinatorics_combinations_h1,combinatorics,combinations,A,1.0,0.85,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,combinatorics_combinations_h2,combinatorics,combinations,A,1.0,0.95,B,0.75,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,combinatorics_combinations_h3,combinatorics,combinations,A,0.0,0.95,B,1.0,B,0.98,B,1.0,B
Qwen2.5-7B-Instruct,combinatorics_probability_e1,combinatorics,probability,A,1.0,0.95,B,0.9,A,0.95,A,0.9,A
Qwen2.5-7B-Instruct,combinatorics_probability_e2,combinatorics,probability,A,0.0,0.9,B,0.9,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,combinatorics_probability_e3,combinatorics,probability,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,combinatorics_probability_m1,combinatorics,probability,A,1.0,0.85,A,0.9,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,combinatorics_probability_m2,combinatorics,probability,B,1.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,combinatorics_probability_m3,combinatorics,probability,A,1.0,0.95,A,0.85,B,0.95,A,0.95,B
Qwen2.5-7B-Instruct,combinatorics_probability_h1,combinatorics,probability,A,1.0,0.95,A,1.0,A,0.98,A,1.0,B
Qwen2.5-7B-Instruct,combinatorics_probability_h2,combinatorics,probability,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,combinatorics_probability_h3,combinatorics,probability,B,1.0,0.95,B,0.95,B,0.99,B,0.95,B
Qwen2.5-7B-Instruct,combinatorics_recursion_e1,combinatorics,recursion,B,1.0,0.85,B,0.9,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,combinatorics_recursion_e2,combinatorics,recursion,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,combinatorics_recursion_e3,combinatorics,recursion,A,0.0,0.85,A,0.9,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,combinatorics_recursion_m1,combinatorics,recursion,A,0.0,0.95,B,0.85,B,0.95,B,0.95,A
Qwen2.5-7B-Instruct,combinatorics_recursion_m2,combinatorics,recursion,B,1.0,0.95,A,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,combinatorics_recursion_m3,combinatorics,recursion,B,1.0,0.85,B,0.95,B,0.9,B,0.95,A
Qwen2.5-7B-Instruct,combinatorics_recursion_h1,combinatorics,recursion,A,1.0,0.95,A,0.85,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,combinatorics_recursion_h2,combinatorics,recursion,A,1.0,0.9,A,0.98,A,0.95,A,1.0,A
Qwen2.5-7B-Instruct,combinatorics_recursion_h3,combinatorics,recursion,A,0.0,0.85,B,0.95,B,0.9,B,1.0,B
Qwen2.5-7B-Instruct,statistics_descriptive_e1,statistics,descriptive statistics,A,1.0,0.85,B,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,statistics_descriptive_e2,statistics,descriptive statistics,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,statistics_descriptive_e3,statistics,descriptive statistics,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,statistics_descriptive_m1,statistics,descriptive statistics,A,0.0,0.95,B,0.95,A,1.0,B,0.9,B
Qwen2.5-7B-Instruct,statistics_descriptive_m2,statistics,descriptive statistics,A,0.0,0.95,B,0.85,B,0.95,A,0.8,B
Qwen2.5-7B-Instruct,statistics_descriptive_m3,statistics,descriptive statistics,A,0.0,0.95,B,0.85,B,0.85,,,A
Qwen2.5-7B-Instruct,statistics_descriptive_h1,statistics,descriptive statistics,A,1.0,0.95,A,0.85,A,0.95,B,0.9,A
Qwen2.5-7B-Instruct,statistics_descriptive_h2,statistics,descriptive statistics,A,0.0,0.95,B,0.9,B,0.95,,,B
Qwen2.5-7B-Instruct,statistics_descriptive_h3,statistics,descriptive statistics,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,statistics_distributions_e1,statistics,distributions,B,1.0,0.9,B,0.9,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,statistics_distributions_e2,statistics,distributions,B,1.0,0.85,B,0.85,B,0.95,A,1.0,B
Qwen2.5-7B-Instruct,statistics_distributions_e3,statistics,distributions,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,statistics_distributions_m1,statistics,distributions,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,statistics_distributions_m2,statistics,distributions,A,1.0,0.95,B,0.95,A,0.95,A,0.9,A
Qwen2.5-7B-Instruct,statistics_distributions_m3,statistics,distributions,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,statistics_distributions_h1,statistics,distributions,A,0.0,0.95,B,0.85,A,0.95,B,0.9,A
Qwen2.5-7B-Instruct,statistics_distributions_h2,statistics,distributions,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,statistics_distributions_h3,statistics,distributions,A,1.0,0.9,A,0.85,A,0.98,B,0.95,B
Qwen2.5-7B-Instruct,statistics_hypothesis_e1,statistics,hypothesis testing,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,statistics_hypothesis_e2,statistics,hypothesis testing,A,1.0,0.85,A,0.85,A,0.92,A,0.8,A
Qwen2.5-7B-Instruct,statistics_hypothesis_e3,statistics,hypothesis testing,A,1.0,0.85,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,statistics_hypothesis_m1,statistics,hypothesis testing,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,statistics_hypothesis_m2,statistics,hypothesis testing,A,1.0,0.95,A,0.85,A,0.95,B,0.95,B
Qwen2.5-7B-Instruct,statistics_hypothesis_m3,statistics,hypothesis testing,A,1.0,0.95,A,0.85,B,0.9,A,0.9,A
Qwen2.5-7B-Instruct,statistics_hypothesis_h1,statistics,hypothesis testing,A,0.0,0.85,B,0.95,B,0.95,A,0.9,B
Qwen2.5-7B-Instruct,statistics_hypothesis_h2,statistics,hypothesis testing,A,1.0,0.9,A,0.95,A,0.95,B,0.8,A
Qwen2.5-7B-Instruct,statistics_hypothesis_h3,statistics,hypothesis testing,A,1.0,0.85,A,0.65,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,statistics_regression_e1,statistics,regression,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,statistics_regression_e2,statistics,regression,A,0.0,0.85,B,0.85,B,0.95,B,0.95,A
Qwen2.5-7B-Instruct,statistics_regression_e3,statistics,regression,A,1.0,0.85,A,0.85,A,0.95,B,0.9,B
Qwen2.5-7B-Instruct,statistics_regression_m1,statistics,regression,A,0.0,0.95,A,0.6,B,0.85,B,0.8,A
Qwen2.5-7B-Instruct,statistics_regression_m2,statistics,regression,A,1.0,0.95,A,0.85,A,0.95,A,1.0,A
Qwen2.5-7B-Instruct,statistics_regression_m3,statistics,regression,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,statistics_regression_h1,statistics,regression,A,1.0,0.95,A,0.85,B,0.95,A,0.95,B
Qwen2.5-7B-Instruct,statistics_regression_h2,statistics,regression,A,0.0,0.95,B,0.9,A,0.95,B,0.9,B
Qwen2.5-7B-Instruct,statistics_regression_h3,statistics,regression,A,0.0,0.9,B,0.9,B,0.98,B,0.95,A
Qwen2.5-7B-Instruct,statistics_bayesian_e1,statistics,bayesian inference,B,1.0,0.95,B,0.85,B,0.95,A,0.95,B
Qwen2.5-7B-Instruct,statistics_bayesian_e2,statistics,bayesian inference,A,0.0,0.9,B,0.85,A,0.95,B,0.9,B
Qwen2.5-7B-Instruct,statistics_bayesian_e3,statistics,bayesian inference,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,statistics_bayesian_m1,statistics,bayesian inference,A,1.0,0.95,A,0.75,B,0.95,A,0.8,B
Qwen2.5-7B-Instruct,statistics_bayesian_m2,statistics,bayesian inference,A,0.0,0.95,B,0.85,B,0.95,B,1.0,B
Qwen2.5-7B-Instruct,statistics_bayesian_m3,statistics,bayesian inference,A,1.0,0.95,A,0.9,A,0.98,A,0.95,B
Qwen2.5-7B-Instruct,statistics_bayesian_h1,statistics,bayesian inference,A,0.0,0.95,B,0.98,B,0.98,B,1.0,A
Qwen2.5-7B-Instruct,statistics_bayesian_h2,statistics,bayesian inference,A,1.0,0.95,A,0.75,A,0.85,A,0.8,A
Qwen2.5-7B-Instruct,statistics_bayesian_h3,statistics,bayesian inference,A,1.0,0.95,A,0.8,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_matrices_e1,linear algebra,matrices,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_matrices_e2,linear algebra,matrices,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,linearalgebra_matrices_e3,linear algebra,matrices,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_matrices_m1,linear algebra,matrices,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_matrices_m2,linear algebra,matrices,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_matrices_m3,linear algebra,matrices,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_matrices_h1,linear algebra,matrices,B,1.0,0.95,B,0.85,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,linearalgebra_matrices_h2,linear algebra,matrices,A,1.0,0.9,A,0.85,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,linearalgebra_matrices_h3,linear algebra,matrices,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,linearalgebra_determinants_e1,linear algebra,determinants,A,0.0,0.95,B,0.95,A,0.95,B,1.0,A
Qwen2.5-7B-Instruct,linearalgebra_determinants_e2,linear algebra,determinants,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,linearalgebra_determinants_e3,linear algebra,determinants,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_determinants_m1,linear algebra,determinants,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_determinants_m2,linear algebra,determinants,A,0.0,0.95,B,0.98,B,0.95,B,1.0,A
Qwen2.5-7B-Instruct,linearalgebra_determinants_m3,linear algebra,determinants,B,1.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_determinants_h1,linear algebra,determinants,B,1.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_determinants_h2,linear algebra,determinants,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_determinants_h3,linear algebra,determinants,A,1.0,0.95,A,0.95,A,0.98,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_vectorspaces_e1,linear algebra,vector spaces,A,0.0,0.85,B,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_vectorspaces_e2,linear algebra,vector spaces,A,0.0,0.95,B,0.95,A,0.95,B,1.0,A
Qwen2.5-7B-Instruct,linearalgebra_vectorspaces_e3,linear algebra,vector spaces,A,0.0,0.95,A,0.85,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_vectorspaces_m1,linear algebra,vector spaces,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_vectorspaces_m2,linear algebra,vector spaces,A,0.0,0.9,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,linearalgebra_vectorspaces_m3,linear algebra,vector spaces,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_vectorspaces_h1,linear algebra,vector spaces,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,linearalgebra_vectorspaces_h2,linear algebra,vector spaces,A,1.0,0.95,B,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,linearalgebra_vectorspaces_h3,linear algebra,vector spaces,A,1.0,0.95,A,0.95,A,0.95,A,0.9,A
Qwen2.5-7B-Instruct,linearalgebra_eigenvalues_e1,linear algebra,eigenvalues,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,linearalgebra_eigenvalues_e2,linear algebra,eigenvalues,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_eigenvalues_e3,linear algebra,eigenvalues,A,1.0,0.85,B,0.85,A,0.95,A,1.0,B
Qwen2.5-7B-Instruct,linearalgebra_eigenvalues_m1,linear algebra,eigenvalues,A,1.0,0.95,B,0.8,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_eigenvalues_m2,linear algebra,eigenvalues,A,0.0,0.9,B,0.85,B,0.95,B,0.95,A
Qwen2.5-7B-Instruct,linearalgebra_eigenvalues_m3,linear algebra,eigenvalues,A,1.0,0.95,A,0.95,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,linearalgebra_eigenvalues_h1,linear algebra,eigenvalues,A,0.0,0.7,B,0.9,B,0.95,B,0.9,A
Qwen2.5-7B-Instruct,linearalgebra_eigenvalues_h2,linear algebra,eigenvalues,A,1.0,0.85,A,0.85,A,0.9,A,0.9,A
Qwen2.5-7B-Instruct,linearalgebra_eigenvalues_h3,linear algebra,eigenvalues,A,1.0,0.95,A,0.6,A,0.95,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_transformations_e1,linear algebra,linear transformations,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_transformations_e2,linear algebra,linear transformations,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Qwen2.5-7B-Instruct,linearalgebra_transformations_e3,linear algebra,linear transformations,A,1.0,0.85,B,0.75,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_transformations_m1,linear algebra,linear transformations,A,1.0,0.95,A,0.9,A,0.95,A,0.95,B
Qwen2.5-7B-Instruct,linearalgebra_transformations_m2,linear algebra,linear transformations,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Qwen2.5-7B-Instruct,linearalgebra_transformations_m3,linear algebra,linear transformations,A,1.0,0.85,A,1.0,A,1.0,A,1.0,A
Qwen2.5-7B-Instruct,linearalgebra_transformations_h1,linear algebra,linear transformations,A,1.0,0.95,B,0.95,A,0.95,,,A
Qwen2.5-7B-Instruct,linearalgebra_transformations_h2,linear algebra,linear transformations,B,1.0,0.95,B,0.95,B,0.98,B,0.95,A
Qwen2.5-7B-Instruct,linearalgebra_transformations_h3,linear algebra,linear transformations,A,0.0,0.9,B,0.92,A,0.95,B,0.9,A
Qwen2.5-Math-7B-Instruct,arithmetic_basic_operations_e1,arithmetic,basic operations,A,1.0,0.8,A,0.95,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,arithmetic_basic_operations_e2,arithmetic,basic operations,A,0.0,0.85,B,0.85,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_basic_operations_e3,arithmetic,basic operations,A,1.0,0.8,A,0.7,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_basic_operations_m1,arithmetic,basic operations,A,1.0,1.0,A,0.85,A,0.98,A,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_basic_operations_m2,arithmetic,basic operations,B,1.0,0.85,B,0.85,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_basic_operations_m3,arithmetic,basic operations,A,0.0,1.0,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_basic_operations_h1,arithmetic,basic operations,A,1.0,0.95,B,0.85,A,0.9,,,A
Qwen2.5-Math-7B-Instruct,arithmetic_basic_operations_h2,arithmetic,basic operations,A,0.0,1.0,B,0.95,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_basic_operations_h3,arithmetic,basic operations,B,0.0,0.9,A,0.51,A,0.95,A,0.9,A
Qwen2.5-Math-7B-Instruct,arithmetic_fractions_e1,arithmetic,fractions,B,1.0,0.85,B,0.95,A,0.95,B,0.9,A
Qwen2.5-Math-7B-Instruct,arithmetic_fractions_e2,arithmetic,fractions,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,arithmetic_fractions_e3,arithmetic,fractions,A,1.0,0.9,A,0.95,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,arithmetic_fractions_m1,arithmetic,fractions,B,0.0,0.95,B,0.55,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,arithmetic_fractions_m2,arithmetic,fractions,A,1.0,0.8,A,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,arithmetic_fractions_m3,arithmetic,fractions,B,0.0,1.0,A,0.55,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,arithmetic_fractions_h1,arithmetic,fractions,A,1.0,1.0,A,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,arithmetic_fractions_h2,arithmetic,fractions,Tie,0.5,0.5,A,0.6,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,arithmetic_fractions_h3,arithmetic,fractions,A,0.0,0.95,B,0.95,B,0.99,B,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_percentages_e1,arithmetic,percentages,B,0.0,0.9,A,0.9,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_percentages_e2,arithmetic,percentages,A,1.0,0.8,B,0.75,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,arithmetic_percentages_e3,arithmetic,percentages,A,1.0,0.9,A,0.55,A,0.95,A,1.0,B
Qwen2.5-Math-7B-Instruct,arithmetic_percentages_m1,arithmetic,percentages,A,0.0,0.9,B,0.95,B,0.95,B,1.0,A
Qwen2.5-Math-7B-Instruct,arithmetic_percentages_m2,arithmetic,percentages,A,0.0,0.85,B,0.85,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,arithmetic_percentages_m3,arithmetic,percentages,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,arithmetic_percentages_h1,arithmetic,percentages,A,1.0,1.0,A,0.85,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,arithmetic_percentages_h2,arithmetic,percentages,A,1.0,1.0,B,0.51,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,arithmetic_percentages_h3,arithmetic,percentages,B,0.0,0.85,A,1.0,A,1.0,A,1.0,B
Qwen2.5-Math-7B-Instruct,arithmetic_numerical_e1,arithmetic,numerical approximation,A,0.0,0.9,B,0.75,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_numerical_e2,arithmetic,numerical approximation,B,0.0,0.9,B,0.55,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,arithmetic_numerical_e3,arithmetic,numerical approximation,A,1.0,1.0,A,0.85,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_numerical_m1,arithmetic,numerical approximation,A,1.0,0.9,A,0.85,B,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_numerical_m2,arithmetic,numerical approximation,A,0.0,1.0,A,0.85,B,0.85,B,0.8,B
Qwen2.5-Math-7B-Instruct,arithmetic_numerical_m3,arithmetic,numerical approximation,A,1.0,0.85,A,0.8,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,arithmetic_numerical_h1,arithmetic,numerical approximation,B,0.0,1.0,A,0.6,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_numerical_h2,arithmetic,numerical approximation,B,1.0,1.0,B,0.85,B,0.9,A,1.0,B
Qwen2.5-Math-7B-Instruct,arithmetic_numerical_h3,arithmetic,numerical approximation,Tie,0.5,0.5,B,0.6,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_order_e1,arithmetic,order of operations,A,1.0,0.9,A,0.95,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,arithmetic_order_e2,arithmetic,order of operations,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_order_e3,arithmetic,order of operations,B,1.0,0.9,B,0.98,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_order_m1,arithmetic,order of operations,B,1.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,arithmetic_order_m2,arithmetic,order of operations,A,0.0,1.0,B,0.85,A,0.95,B,0.9,A
Qwen2.5-Math-7B-Instruct,arithmetic_order_m3,arithmetic,order of operations,Tie,0.5,0.5,B,0.95,A,0.95,B,0.9,A
Qwen2.5-Math-7B-Instruct,arithmetic_order_h1,arithmetic,order of operations,A,1.0,0.85,A,0.5,A,1.0,A,1.0,A
Qwen2.5-Math-7B-Instruct,arithmetic_order_h2,arithmetic,order of operations,A,0.0,1.0,B,0.95,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,arithmetic_order_h3,arithmetic,order of operations,Tie,0.5,0.5,B,0.85,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_equations_e1,algebra,equations,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_equations_e2,algebra,equations,A,1.0,0.9,A,0.55,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_equations_e3,algebra,equations,A,0.0,0.9,B,0.85,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,algebra_equations_m1,algebra,equations,A,0.0,0.9,B,0.95,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_equations_m2,algebra,equations,B,0.0,0.85,B,0.75,A,0.95,A,0.9,A
Qwen2.5-Math-7B-Instruct,algebra_equations_m3,algebra,equations,A,1.0,1.0,A,0.7,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_equations_h1,algebra,equations,A,1.0,0.8,A,0.5,A,0.95,A,0.6,A
Qwen2.5-Math-7B-Instruct,algebra_equations_h2,algebra,equations,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,algebra_equations_h3,algebra,equations,B,0.0,0.9,A,1.0,A,0.95,A,1.0,B
Qwen2.5-Math-7B-Instruct,algebra_inequalities_e1,algebra,inequalities,A,1.0,1.0,A,0.51,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_inequalities_e2,algebra,inequalities,B,1.0,0.8,B,0.95,B,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,algebra_inequalities_e3,algebra,inequalities,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_inequalities_m1,algebra,inequalities,Tie,0.5,0.5,B,0.9,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,algebra_inequalities_m2,algebra,inequalities,B,1.0,0.85,B,0.95,B,0.95,B,1.0,B
Qwen2.5-Math-7B-Instruct,algebra_inequalities_m3,algebra,inequalities,A,0.0,0.9,B,0.85,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_inequalities_h1,algebra,inequalities,A,1.0,0.9,B,0.55,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,algebra_inequalities_h2,algebra,inequalities,A,1.0,0.9,B,0.51,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,algebra_inequalities_h3,algebra,inequalities,A,0.0,0.85,B,0.51,A,0.99,B,0.7,B
Qwen2.5-Math-7B-Instruct,algebra_polynomials_e1,algebra,polynomials,B,0.0,0.85,B,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,algebra_polynomials_e2,algebra,polynomials,B,1.0,0.95,B,0.85,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,algebra_polynomials_e3,algebra,polynomials,Tie,0.5,0.5,A,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,algebra_polynomials_m1,algebra,polynomials,A,1.0,0.9,B,0.55,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_polynomials_m2,algebra,polynomials,A,1.0,1.0,A,0.5,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,algebra_polynomials_m3,algebra,polynomials,Tie,0.5,0.5,A,0.85,A,0.95,B,1.0,A
Qwen2.5-Math-7B-Instruct,algebra_polynomials_h1,algebra,polynomials,A,1.0,0.9,A,0.85,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,algebra_polynomials_h2,algebra,polynomials,A,1.0,0.95,A,0.85,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_polynomials_h3,algebra,polynomials,Tie,0.5,0.5,A,0.6,B,0.9,A,0.75,B
Qwen2.5-Math-7B-Instruct,algebra_functions_e1,algebra,functions,Tie,0.5,0.5,B,0.85,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_functions_e2,algebra,functions,A,0.0,1.0,B,0.85,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_functions_e3,algebra,functions,Tie,0.5,0.5,B,0.85,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,algebra_functions_m1,algebra,functions,A,1.0,0.9,A,0.95,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_functions_m2,algebra,functions,B,0.0,0.9,A,0.6,A,0.98,A,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_functions_m3,algebra,functions,B,1.0,1.0,B,0.85,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,algebra_functions_h1,algebra,functions,Tie,0.5,0.5,B,0.85,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_functions_h2,algebra,functions,A,1.0,0.95,A,0.85,A,0.98,A,1.0,B
Qwen2.5-Math-7B-Instruct,algebra_functions_h3,algebra,functions,B,0.0,1.0,B,0.85,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_systems_e1,algebra,systems of equations,A,1.0,0.95,A,0.7,A,0.95,A,0.9,A
Qwen2.5-Math-7B-Instruct,algebra_systems_e2,algebra,systems of equations,A,0.0,1.0,B,0.95,B,0.98,B,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_systems_e3,algebra,systems of equations,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,algebra_systems_m1,algebra,systems of equations,A,1.0,0.95,A,1.0,A,1.0,A,1.0,B
Qwen2.5-Math-7B-Instruct,algebra_systems_m2,algebra,systems of equations,Tie,0.5,0.5,A,0.5,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,algebra_systems_m3,algebra,systems of equations,Tie,0.5,0.5,A,0.98,A,0.95,A,1.0,B
Qwen2.5-Math-7B-Instruct,algebra_systems_h1,algebra,systems of equations,A,1.0,0.8,B,0.51,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,algebra_systems_h2,algebra,systems of equations,A,1.0,1.0,A,0.95,A,0.98,A,1.0,B
Qwen2.5-Math-7B-Instruct,algebra_systems_h3,algebra,systems of equations,Tie,0.5,0.5,B,0.85,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,calculus_differentiation_e1,calculus,differentiation,A,1.0,1.0,A,0.85,A,0.98,A,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_differentiation_e2,calculus,differentiation,B,1.0,0.9,A,0.9,B,0.95,B,1.0,B
Qwen2.5-Math-7B-Instruct,calculus_differentiation_e3,calculus,differentiation,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,calculus_differentiation_m1,calculus,differentiation,Tie,0.5,0.5,B,0.95,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_differentiation_m2,calculus,differentiation,A,0.0,0.95,B,0.95,B,0.98,B,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_differentiation_m3,calculus,differentiation,Tie,0.5,0.5,A,0.5,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_differentiation_h1,calculus,differentiation,A,1.0,0.85,A,0.6,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_differentiation_h2,calculus,differentiation,Tie,0.5,0.5,B,0.51,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_differentiation_h3,calculus,differentiation,A,1.0,0.95,A,0.55,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,calculus_integration_e1,calculus,integration,Tie,0.5,0.5,A,0.85,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_integration_e2,calculus,integration,Tie,0.5,0.5,B,0.65,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_integration_e3,calculus,integration,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,calculus_integration_m1,calculus,integration,A,1.0,0.95,A,0.55,A,0.99,A,0.95,B
Qwen2.5-Math-7B-Instruct,calculus_integration_m2,calculus,integration,B,0.0,0.9,B,0.51,A,1.0,A,1.0,B
Qwen2.5-Math-7B-Instruct,calculus_integration_m3,calculus,integration,Tie,0.5,0.5,B,0.51,A,0.95,A,1.0,B
Qwen2.5-Math-7B-Instruct,calculus_integration_h1,calculus,integration,Tie,0.5,0.5,A,0.5,A,1.0,A,0.95,B
Qwen2.5-Math-7B-Instruct,calculus_integration_h2,calculus,integration,B,0.0,0.9,A,0.75,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_integration_h3,calculus,integration,B,1.0,1.0,B,0.95,B,1.0,B,1.0,A
Qwen2.5-Math-7B-Instruct,calculus_limits_e1,calculus,limits,A,0.0,1.0,B,0.85,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,calculus_limits_e2,calculus,limits,A,0.0,1.0,B,0.9,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_limits_e3,calculus,limits,A,1.0,0.85,A,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_limits_m1,calculus,limits,A,1.0,0.9,A,0.85,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,calculus_limits_m2,calculus,limits,B,0.0,0.85,A,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_limits_m3,calculus,limits,A,0.0,0.95,B,0.85,A,0.95,B,0.9,A
Qwen2.5-Math-7B-Instruct,calculus_limits_h1,calculus,limits,Tie,0.5,0.5,B,0.51,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,calculus_limits_h2,calculus,limits,A,0.0,0.9,B,0.85,B,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_limits_h3,calculus,limits,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,calculus_series_e1,calculus,series,Tie,0.5,0.5,B,0.51,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_series_e2,calculus,series,A,1.0,1.0,B,0.65,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,calculus_series_e3,calculus,series,A,0.0,0.5,B,0.85,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_series_m1,calculus,series,B,1.0,0.95,B,0.95,A,0.95,B,1.0,A
Qwen2.5-Math-7B-Instruct,calculus_series_m2,calculus,series,A,1.0,0.95,B,0.85,A,0.95,A,0.9,B
Qwen2.5-Math-7B-Instruct,calculus_series_m3,calculus,series,B,0.0,0.85,B,0.9,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,calculus_series_h1,calculus,series,B,1.0,1.0,B,0.9,B,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_series_h2,calculus,series,A,0.0,1.0,B,0.85,A,0.99,B,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_series_h3,calculus,series,B,0.0,0.8,B,0.51,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,calculus_applications_e1,calculus,applications,A,1.0,1.0,A,0.8,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,calculus_applications_e2,calculus,applications,A,1.0,0.9,A,0.75,A,0.95,A,1.0,B
Qwen2.5-Math-7B-Instruct,calculus_applications_e3,calculus,applications,A,0.0,0.85,B,0.9,A,0.95,B,1.0,A
Qwen2.5-Math-7B-Instruct,calculus_applications_m1,calculus,applications,A,1.0,1.0,A,0.51,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,calculus_applications_m2,calculus,applications,A,1.0,0.95,A,0.85,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_applications_m3,calculus,applications,A,0.0,0.9,B,0.55,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,calculus_applications_h1,calculus,applications,A,1.0,0.9,A,0.55,A,0.98,B,1.0,B
Qwen2.5-Math-7B-Instruct,calculus_applications_h2,calculus,applications,Tie,0.5,0.5,A,0.51,A,0.99,A,0.95,A
Qwen2.5-Math-7B-Instruct,calculus_applications_h3,calculus,applications,Tie,0.5,0.5,A,0.85,A,0.98,A,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_plane_e1,geometry,plane geometry,B,0.0,1.0,A,0.9,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_plane_e2,geometry,plane geometry,A,1.0,0.9,A,0.95,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,geometry_plane_e3,geometry,plane geometry,B,1.0,1.0,B,0.85,B,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_plane_m1,geometry,plane geometry,B,1.0,1.0,B,0.85,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,geometry_plane_m2,geometry,plane geometry,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_plane_m3,geometry,plane geometry,B,1.0,0.8,B,0.92,B,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,geometry_plane_h1,geometry,plane geometry,B,1.0,0.9,B,0.95,B,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_plane_h2,geometry,plane geometry,A,0.0,0.9,B,0.85,B,0.98,B,1.0,B
Qwen2.5-Math-7B-Instruct,geometry_plane_h3,geometry,plane geometry,Tie,0.5,0.5,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,geometry_coordinate_e1,geometry,coordinate geometry,A,0.0,0.9,B,0.95,A,0.95,B,1.0,A
Qwen2.5-Math-7B-Instruct,geometry_coordinate_e2,geometry,coordinate geometry,A,1.0,1.0,A,0.95,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,geometry_coordinate_e3,geometry,coordinate geometry,A,1.0,0.8,B,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_coordinate_m1,geometry,coordinate geometry,B,1.0,1.0,B,0.75,B,0.98,B,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_coordinate_m2,geometry,coordinate geometry,A,0.0,0.85,B,0.6,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,geometry_coordinate_m3,geometry,coordinate geometry,A,1.0,0.9,A,0.85,B,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,geometry_coordinate_h1,geometry,coordinate geometry,Tie,0.5,0.5,B,0.51,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_coordinate_h2,geometry,coordinate geometry,A,1.0,0.8,B,0.51,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_coordinate_h3,geometry,coordinate geometry,A,0.0,1.0,B,0.9,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,geometry_transformations_e1,geometry,transformations,A,0.0,0.95,B,0.51,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,geometry_transformations_e2,geometry,transformations,B,1.0,1.0,B,0.95,B,0.95,B,0.9,A
Qwen2.5-Math-7B-Instruct,geometry_transformations_e3,geometry,transformations,B,1.0,0.8,B,0.95,B,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_transformations_m1,geometry,transformations,A,1.0,0.85,A,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_transformations_m2,geometry,transformations,Tie,0.5,0.5,B,1.0,B,0.98,B,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_transformations_m3,geometry,transformations,B,0.0,1.0,A,0.55,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_transformations_h1,geometry,transformations,A,0.0,0.95,B,0.85,A,0.95,B,0.9,B
Qwen2.5-Math-7B-Instruct,geometry_transformations_h2,geometry,transformations,Tie,0.5,0.5,B,0.95,B,0.98,B,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_transformations_h3,geometry,transformations,A,0.0,1.0,B,0.9,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,geometry_mensuration_e1,geometry,mensuration,A,1.0,0.8,A,0.6,A,0.95,A,1.0,B
Qwen2.5-Math-7B-Instruct,geometry_mensuration_e2,geometry,mensuration,A,0.0,1.0,B,0.85,B,0.98,B,1.0,A
Qwen2.5-Math-7B-Instruct,geometry_mensuration_e3,geometry,mensuration,A,1.0,0.8,B,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_mensuration_m1,geometry,mensuration,A,0.0,1.0,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,geometry_mensuration_m2,geometry,mensuration,A,1.0,0.8,A,0.75,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,geometry_mensuration_m3,geometry,mensuration,B,1.0,1.0,B,0.95,A,0.95,B,0.9,A
Qwen2.5-Math-7B-Instruct,geometry_mensuration_h1,geometry,mensuration,Tie,0.5,0.5,B,0.85,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,geometry_mensuration_h2,geometry,mensuration,Tie,0.5,0.5,A,0.85,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,geometry_mensuration_h3,geometry,mensuration,Tie,0.5,0.5,A,0.95,A,0.75,B,0.75,A
Qwen2.5-Math-7B-Instruct,geometry_trigonometry_e1,geometry,trigonometry,B,0.0,0.95,A,0.75,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,geometry_trigonometry_e2,geometry,trigonometry,A,0.0,0.9,B,0.95,B,0.95,B,1.0,B
Qwen2.5-Math-7B-Instruct,geometry_trigonometry_e3,geometry,trigonometry,A,1.0,0.9,A,0.85,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,geometry_trigonometry_m1,geometry,trigonometry,A,1.0,0.85,A,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_trigonometry_m2,geometry,trigonometry,A,1.0,0.85,B,0.75,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_trigonometry_m3,geometry,trigonometry,A,1.0,0.8,A,0.6,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,geometry_trigonometry_h1,geometry,trigonometry,A,1.0,0.8,A,0.95,A,0.98,A,0.95,A
Qwen2.5-Math-7B-Instruct,geometry_trigonometry_h2,geometry,trigonometry,Tie,0.5,0.5,A,1.0,A,0.98,,,A
Qwen2.5-Math-7B-Instruct,geometry_trigonometry_h3,geometry,trigonometry,A,1.0,1.0,A,0.9,B,0.95,A,0.9,B
Qwen2.5-Math-7B-Instruct,numbertheory_divisibility_e1,number theory,divisibility,A,1.0,0.9,B,0.51,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_divisibility_e2,number theory,divisibility,A,1.0,0.95,B,0.65,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_divisibility_e3,number theory,divisibility,A,0.0,1.0,B,0.9,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,numbertheory_divisibility_m1,number theory,divisibility,B,1.0,0.85,B,0.85,B,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,numbertheory_divisibility_m2,number theory,divisibility,A,0.0,0.9,B,0.9,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_divisibility_m3,number theory,divisibility,A,0.0,0.9,B,0.95,B,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,numbertheory_divisibility_h1,number theory,divisibility,Tie,0.5,0.5,B,0.85,A,0.95,A,1.0,B
Qwen2.5-Math-7B-Instruct,numbertheory_divisibility_h2,number theory,divisibility,Tie,0.5,0.5,B,0.85,B,0.99,B,0.95,A
Qwen2.5-Math-7B-Instruct,numbertheory_divisibility_h3,number theory,divisibility,B,0.0,0.85,B,0.95,A,0.95,A,1.0,B
Qwen2.5-Math-7B-Instruct,numbertheory_modular_e1,number theory,modular arithmetic,B,1.0,0.85,B,0.95,A,0.95,B,0.9,A
Qwen2.5-Math-7B-Instruct,numbertheory_modular_e2,number theory,modular arithmetic,Tie,0.5,0.5,A,0.55,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_modular_e3,number theory,modular arithmetic,B,1.0,0.8,B,0.95,B,0.95,B,1.0,A
Qwen2.5-Math-7B-Instruct,numbertheory_modular_m1,number theory,modular arithmetic,A,1.0,0.9,B,0.95,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,numbertheory_modular_m2,number theory,modular arithmetic,Tie,0.5,0.5,B,0.55,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_modular_m3,number theory,modular arithmetic,A,0.0,0.95,B,0.75,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_modular_h1,number theory,modular arithmetic,Tie,0.5,0.5,B,0.8,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,numbertheory_modular_h2,number theory,modular arithmetic,A,0.0,1.0,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_modular_h3,number theory,modular arithmetic,A,0.0,0.9,B,0.51,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_primes_e1,number theory,primes,B,1.0,0.9,B,0.6,A,1.0,B,0.95,A
Qwen2.5-Math-7B-Instruct,numbertheory_primes_e2,number theory,primes,A,0.0,1.0,B,0.95,B,0.95,B,1.0,A
Qwen2.5-Math-7B-Instruct,numbertheory_primes_e3,number theory,primes,A,1.0,0.85,B,0.6,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_primes_m1,number theory,primes,B,0.0,0.9,A,0.6,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,numbertheory_primes_m2,number theory,primes,A,0.0,1.0,B,0.95,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_primes_m3,number theory,primes,B,0.0,0.85,A,0.85,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_primes_h1,number theory,primes,Tie,0.5,0.5,A,0.95,A,0.95,B,0.9,B
Qwen2.5-Math-7B-Instruct,numbertheory_primes_h2,number theory,primes,A,1.0,1.0,A,0.95,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_primes_h3,number theory,primes,A,1.0,1.0,A,0.55,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_diophantine_e1,number theory,diophantine equations,A,1.0,0.9,B,0.51,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_diophantine_e2,number theory,diophantine equations,A,1.0,0.95,B,0.85,A,0.95,A,0.9,B
Qwen2.5-Math-7B-Instruct,numbertheory_diophantine_e3,number theory,diophantine equations,B,0.0,0.9,A,0.9,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,numbertheory_diophantine_m1,number theory,diophantine equations,A,1.0,0.85,A,0.85,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_diophantine_m2,number theory,diophantine equations,B,1.0,0.95,B,0.55,B,0.99,B,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_diophantine_m3,number theory,diophantine equations,B,0.0,0.85,A,1.0,A,0.95,A,1.0,B
Qwen2.5-Math-7B-Instruct,numbertheory_diophantine_h1,number theory,diophantine equations,B,1.0,1.0,B,0.85,B,0.95,B,0.9,A
Qwen2.5-Math-7B-Instruct,numbertheory_diophantine_h2,number theory,diophantine equations,A,0.0,0.85,B,0.85,B,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,numbertheory_diophantine_h3,number theory,diophantine equations,A,1.0,0.9,B,0.95,A,0.65,A,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_sequences_e1,number theory,number sequences,Tie,0.5,0.5,A,0.51,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,numbertheory_sequences_e2,number theory,number sequences,B,1.0,0.8,B,0.95,B,0.95,B,1.0,A
Qwen2.5-Math-7B-Instruct,numbertheory_sequences_e3,number theory,number sequences,B,0.0,0.85,B,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,numbertheory_sequences_m1,number theory,number sequences,A,0.0,1.0,B,0.85,B,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_sequences_m2,number theory,number sequences,Tie,0.5,0.5,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_sequences_m3,number theory,number sequences,A,1.0,1.0,B,0.55,A,0.95,A,0.9,A
Qwen2.5-Math-7B-Instruct,numbertheory_sequences_h1,number theory,number sequences,A,1.0,0.85,A,0.75,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_sequences_h2,number theory,number sequences,Tie,0.5,0.5,B,0.85,B,1.0,B,0.95,B
Qwen2.5-Math-7B-Instruct,numbertheory_sequences_h3,number theory,number sequences,A,0.0,1.0,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_counting_e1,combinatorics,counting principles,B,1.0,0.9,B,0.55,A,0.95,B,0.85,B
Qwen2.5-Math-7B-Instruct,combinatorics_counting_e2,combinatorics,counting principles,A,1.0,0.9,B,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,combinatorics_counting_e3,combinatorics,counting principles,A,0.0,1.0,B,0.85,A,0.95,B,0.9,A
Qwen2.5-Math-7B-Instruct,combinatorics_counting_m1,combinatorics,counting principles,B,0.0,1.0,A,0.85,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,combinatorics_counting_m2,combinatorics,counting principles,A,1.0,0.8,B,0.75,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_counting_m3,combinatorics,counting principles,A,0.0,0.9,B,0.8,B,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,combinatorics_counting_h1,combinatorics,counting principles,Tie,0.5,0.5,B,0.95,A,0.95,B,1.0,A
Qwen2.5-Math-7B-Instruct,combinatorics_counting_h2,combinatorics,counting principles,A,1.0,0.6,A,0.55,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,combinatorics_counting_h3,combinatorics,counting principles,A,1.0,1.0,A,0.7,A,0.95,B,1.0,B
Qwen2.5-Math-7B-Instruct,combinatorics_permutations_e1,combinatorics,permutations,A,0.0,0.9,B,0.95,B,0.95,B,1.0,B
Qwen2.5-Math-7B-Instruct,combinatorics_permutations_e2,combinatorics,permutations,A,0.0,0.9,B,0.95,B,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,combinatorics_permutations_e3,combinatorics,permutations,A,1.0,1.0,B,0.51,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,combinatorics_permutations_m1,combinatorics,permutations,Tie,0.5,0.5,B,0.6,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_permutations_m2,combinatorics,permutations,A,1.0,0.9,A,0.95,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,combinatorics_permutations_m3,combinatorics,permutations,A,0.0,1.0,B,0.55,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_permutations_h1,combinatorics,permutations,A,1.0,0.9,B,0.51,A,0.95,A,1.0,B
Qwen2.5-Math-7B-Instruct,combinatorics_permutations_h2,combinatorics,permutations,A,0.0,1.0,B,0.55,A,1.0,B,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_permutations_h3,combinatorics,permutations,Tie,0.5,0.5,B,0.7,A,0.75,B,0.65,A
Qwen2.5-Math-7B-Instruct,combinatorics_combinations_e1,combinatorics,combinations,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_combinations_e2,combinatorics,combinations,A,1.0,0.9,A,0.95,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,combinatorics_combinations_e3,combinatorics,combinations,B,1.0,0.9,B,0.51,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,combinatorics_combinations_m1,combinatorics,combinations,Tie,0.5,0.5,B,0.55,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,combinatorics_combinations_m2,combinatorics,combinations,B,1.0,1.0,B,0.85,B,0.95,B,0.6,A
Qwen2.5-Math-7B-Instruct,combinatorics_combinations_m3,combinatorics,combinations,Tie,0.5,0.5,B,0.55,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_combinations_h1,combinatorics,combinations,A,0.0,0.8,B,0.85,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_combinations_h2,combinatorics,combinations,B,0.0,1.0,A,0.9,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_combinations_h3,combinatorics,combinations,A,1.0,1.0,B,0.55,A,0.99,A,1.0,B
Qwen2.5-Math-7B-Instruct,combinatorics_probability_e1,combinatorics,probability,A and B are equally good,0.0,0.5,B,0.95,B,0.95,B,1.0,A
Qwen2.5-Math-7B-Instruct,combinatorics_probability_e2,combinatorics,probability,A,1.0,0.8,B,0.95,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,combinatorics_probability_e3,combinatorics,probability,A,0.0,0.9,B,0.75,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_probability_m1,combinatorics,probability,B,1.0,0.85,B,0.9,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,combinatorics_probability_m2,combinatorics,probability,Tie,0.5,0.5,A,0.95,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,combinatorics_probability_m3,combinatorics,probability,A,1.0,1.0,A,0.55,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,combinatorics_probability_h1,combinatorics,probability,Tie,0.5,0.5,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_probability_h2,combinatorics,probability,Tie,0.5,0.5,B,0.51,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_probability_h3,combinatorics,probability,Tie,0.5,0.5,A,0.95,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_recursion_e1,combinatorics,recursion,B,0.0,1.0,A,0.6,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_recursion_e2,combinatorics,recursion,Tie,0.5,0.5,A,0.95,A,0.98,A,1.0,A
Qwen2.5-Math-7B-Instruct,combinatorics_recursion_e3,combinatorics,recursion,A,1.0,0.9,B,0.6,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_recursion_m1,combinatorics,recursion,B,1.0,0.9,B,0.85,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_recursion_m2,combinatorics,recursion,A,1.0,0.9,A,0.55,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_recursion_m3,combinatorics,recursion,Tie,0.5,0.5,A,0.7,A,0.75,A,1.0,A
Qwen2.5-Math-7B-Instruct,combinatorics_recursion_h1,combinatorics,recursion,Tie,0.5,0.5,A,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,combinatorics_recursion_h2,combinatorics,recursion,A,1.0,0.9,A,0.85,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,combinatorics_recursion_h3,combinatorics,recursion,A,0.0,0.9,B,0.95,B,0.95,B,0.9,A
Qwen2.5-Math-7B-Instruct,statistics_descriptive_e1,statistics,descriptive statistics,A,0.0,0.8,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,statistics_descriptive_e2,statistics,descriptive statistics,A,0.0,1.0,B,0.85,B,0.98,B,1.0,B
Qwen2.5-Math-7B-Instruct,statistics_descriptive_e3,statistics,descriptive statistics,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,statistics_descriptive_m1,statistics,descriptive statistics,A,0.0,0.9,B,0.6,A,0.95,B,0.7,B
Qwen2.5-Math-7B-Instruct,statistics_descriptive_m2,statistics,descriptive statistics,A,0.0,0.85,B,0.55,A,0.9,B,0.8,A
Qwen2.5-Math-7B-Instruct,statistics_descriptive_m3,statistics,descriptive statistics,A,0.0,1.0,B,0.95,B,0.95,B,0.9,A
Qwen2.5-Math-7B-Instruct,statistics_descriptive_h1,statistics,descriptive statistics,A,0.0,1.0,B,0.9,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,statistics_descriptive_h2,statistics,descriptive statistics,A,1.0,0.9,B,0.8,A,0.85,,,A
Qwen2.5-Math-7B-Instruct,statistics_descriptive_h3,statistics,descriptive statistics,B,0.0,0.9,B,0.55,A,0.95,A,0.9,B
Qwen2.5-Math-7B-Instruct,statistics_distributions_e1,statistics,distributions,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,statistics_distributions_e2,statistics,distributions,B,1.0,1.0,B,0.85,B,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,statistics_distributions_e3,statistics,distributions,B,1.0,0.8,B,0.85,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,statistics_distributions_m1,statistics,distributions,A,1.0,0.8,B,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,statistics_distributions_m2,statistics,distributions,B,1.0,0.9,B,0.95,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,statistics_distributions_m3,statistics,distributions,A,1.0,0.9,A,0.55,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,statistics_distributions_h1,statistics,distributions,Tie,0.5,0.5,A,0.5,B,0.99,B,0.95,A
Qwen2.5-Math-7B-Instruct,statistics_distributions_h2,statistics,distributions,Tie,0.5,0.5,B,0.6,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,statistics_distributions_h3,statistics,distributions,Tie,0.5,0.5,B,0.85,A,0.98,A,0.95,A
Qwen2.5-Math-7B-Instruct,statistics_hypothesis_e1,statistics,hypothesis testing,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,statistics_hypothesis_e2,statistics,hypothesis testing,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,statistics_hypothesis_e3,statistics,hypothesis testing,A,0.0,0.85,B,0.85,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,statistics_hypothesis_m1,statistics,hypothesis testing,A,1.0,1.0,A,0.95,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,statistics_hypothesis_m2,statistics,hypothesis testing,A,1.0,1.0,A,0.85,A,0.95,B,0.9,A
Qwen2.5-Math-7B-Instruct,statistics_hypothesis_m3,statistics,hypothesis testing,A,0.0,1.0,B,0.85,B,0.95,A,0.8,B
Qwen2.5-Math-7B-Instruct,statistics_hypothesis_h1,statistics,hypothesis testing,A,1.0,0.85,A,0.85,A,0.95,B,0.9,A
Qwen2.5-Math-7B-Instruct,statistics_hypothesis_h2,statistics,hypothesis testing,B,0.0,0.95,A,0.85,A,0.95,A,0.9,A
Qwen2.5-Math-7B-Instruct,statistics_hypothesis_h3,statistics,hypothesis testing,A,0.0,0.85,B,0.55,B,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,statistics_regression_e1,statistics,regression,A,1.0,0.9,A,0.85,A,0.95,A,0.9,B
Qwen2.5-Math-7B-Instruct,statistics_regression_e2,statistics,regression,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,statistics_regression_e3,statistics,regression,A,1.0,0.9,A,0.85,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,statistics_regression_m1,statistics,regression,A,0.0,1.0,B,0.95,B,0.99,B,1.0,A
Qwen2.5-Math-7B-Instruct,statistics_regression_m2,statistics,regression,A,0.0,0.85,B,0.51,A,0.95,B,0.8,B
Qwen2.5-Math-7B-Instruct,statistics_regression_m3,statistics,regression,A,0.0,0.9,B,0.75,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,statistics_regression_h1,statistics,regression,A,0.0,1.0,B,0.95,A,0.99,B,0.9,B
Qwen2.5-Math-7B-Instruct,statistics_regression_h2,statistics,regression,Tie,0.5,0.5,B,0.85,A,0.95,B,1.0,A
Qwen2.5-Math-7B-Instruct,statistics_regression_h3,statistics,regression,Tie,0.5,0.5,B,0.9,B,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,statistics_bayesian_e1,statistics,bayesian inference,A,0.0,0.85,B,0.55,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,statistics_bayesian_e2,statistics,bayesian inference,A,1.0,0.8,A,0.75,A,0.95,A,0.9,A
Qwen2.5-Math-7B-Instruct,statistics_bayesian_e3,statistics,bayesian inference,A,1.0,0.035699999999999996,A,0.95,A,0.95,A,1.0,B
Qwen2.5-Math-7B-Instruct,statistics_bayesian_m1,statistics,bayesian inference,Tie,0.5,0.5,B,0.5,A,0.95,B,1.0,A
Qwen2.5-Math-7B-Instruct,statistics_bayesian_m2,statistics,bayesian inference,Tie,0.5,0.5,B,0.95,A,0.95,B,0.9,B
Qwen2.5-Math-7B-Instruct,statistics_bayesian_m3,statistics,bayesian inference,A,1.0,0.9,A,0.6,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,statistics_bayesian_h1,statistics,bayesian inference,Tie,0.5,0.5,B,0.95,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,statistics_bayesian_h2,statistics,bayesian inference,B,1.0,0.7,B,0.9,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,statistics_bayesian_h3,statistics,bayesian inference,A,0.0,0.9,B,0.85,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,linearalgebra_matrices_e1,linear algebra,matrices,A,0.0,1.0,B,0.9,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,linearalgebra_matrices_e2,linear algebra,matrices,Tie,0.5,0.5,B,0.85,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,linearalgebra_matrices_e3,linear algebra,matrices,A,0.0,0.85,B,0.85,B,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,linearalgebra_matrices_m1,linear algebra,matrices,A,0.0,0.9,B,0.8,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,linearalgebra_matrices_m2,linear algebra,matrices,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,linearalgebra_matrices_m3,linear algebra,matrices,B,0.0,0.85,A,0.95,B,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,linearalgebra_matrices_h1,linear algebra,matrices,B,1.0,0.9,B,0.85,A,0.95,B,0.9,B
Qwen2.5-Math-7B-Instruct,linearalgebra_matrices_h2,linear algebra,matrices,A,0.0,1.0,B,0.55,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,linearalgebra_matrices_h3,linear algebra,matrices,Tie,0.5,0.5,A,0.85,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,linearalgebra_determinants_e1,linear algebra,determinants,A,0.0,1.0,B,0.85,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,linearalgebra_determinants_e2,linear algebra,determinants,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,linearalgebra_determinants_e3,linear algebra,determinants,A,1.0,1.0,B,0.51,A,0.95,A,0.75,A
Qwen2.5-Math-7B-Instruct,linearalgebra_determinants_m1,linear algebra,determinants,B,1.0,0.9,B,0.85,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,linearalgebra_determinants_m2,linear algebra,determinants,Tie,0.5,0.5,B,0.6,B,0.95,B,0.9,B
Qwen2.5-Math-7B-Instruct,linearalgebra_determinants_m3,linear algebra,determinants,A,0.0,0.9,B,0.9,A,0.95,B,0.95,A
Qwen2.5-Math-7B-Instruct,linearalgebra_determinants_h1,linear algebra,determinants,A,0.0,1.0,B,0.98,B,0.98,B,1.0,A
Qwen2.5-Math-7B-Instruct,linearalgebra_determinants_h2,linear algebra,determinants,A,1.0,0.85,A,0.95,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,linearalgebra_determinants_h3,linear algebra,determinants,A,0.0,1.0,B,0.9,B,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,linearalgebra_vectorspaces_e1,linear algebra,vector spaces,A,1.0,0.85,B,0.51,A,0.99,A,1.0,A
Qwen2.5-Math-7B-Instruct,linearalgebra_vectorspaces_e2,linear algebra,vector spaces,B,1.0,0.9,B,0.9,B,0.95,B,1.0,A
Qwen2.5-Math-7B-Instruct,linearalgebra_vectorspaces_e3,linear algebra,vector spaces,A,1.0,0.9,A,0.55,A,0.95,B,1.0,A
Qwen2.5-Math-7B-Instruct,linearalgebra_vectorspaces_m1,linear algebra,vector spaces,Tie,0.5,0.5,B,0.51,A,0.95,B,0.9,A
Qwen2.5-Math-7B-Instruct,linearalgebra_vectorspaces_m2,linear algebra,vector spaces,Tie,0.5,0.5,B,0.51,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,linearalgebra_vectorspaces_m3,linear algebra,vector spaces,A,1.0,1.0,B,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,linearalgebra_vectorspaces_h1,linear algebra,vector spaces,A,0.0,1.0,B,0.95,B,0.95,B,1.0,B
Qwen2.5-Math-7B-Instruct,linearalgebra_vectorspaces_h2,linear algebra,vector spaces,B,0.0,0.8,A,0.95,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,linearalgebra_vectorspaces_h3,linear algebra,vector spaces,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,linearalgebra_eigenvalues_e1,linear algebra,eigenvalues,B,0.0,1.0,A,0.85,A,0.98,A,0.95,A
Qwen2.5-Math-7B-Instruct,linearalgebra_eigenvalues_e2,linear algebra,eigenvalues,B,0.0,0.9,A,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,linearalgebra_eigenvalues_e3,linear algebra,eigenvalues,A,1.0,0.9,B,0.75,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,linearalgebra_eigenvalues_m1,linear algebra,eigenvalues,A,0.0,0.55,B,0.85,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,linearalgebra_eigenvalues_m2,linear algebra,eigenvalues,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,linearalgebra_eigenvalues_m3,linear algebra,eigenvalues,A,1.0,1.0,A,0.95,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,linearalgebra_eigenvalues_h1,linear algebra,eigenvalues,Tie,0.5,0.5,B,1.0,B,0.98,B,1.0,B
Qwen2.5-Math-7B-Instruct,linearalgebra_eigenvalues_h2,linear algebra,eigenvalues,B,0.0,0.95,A,0.75,A,0.85,A,0.95,A
Qwen2.5-Math-7B-Instruct,linearalgebra_eigenvalues_h3,linear algebra,eigenvalues,Tie,0.5,0.5,B,0.85,B,0.95,,,A
Qwen2.5-Math-7B-Instruct,linearalgebra_transformations_e1,linear algebra,linear transformations,B,1.0,0.95,B,0.85,B,0.95,A,0.9,A
Qwen2.5-Math-7B-Instruct,linearalgebra_transformations_e2,linear algebra,linear transformations,Tie,0.5,0.5,A,0.85,A,0.95,A,1.0,A
Qwen2.5-Math-7B-Instruct,linearalgebra_transformations_e3,linear algebra,linear transformations,A,1.0,0.9,A,0.55,A,0.95,A,0.95,B
Qwen2.5-Math-7B-Instruct,linearalgebra_transformations_m1,linear algebra,linear transformations,B,0.0,1.0,A,0.65,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,linearalgebra_transformations_m2,linear algebra,linear transformations,Tie,0.5,0.5,B,0.6,A,0.95,B,0.95,B
Qwen2.5-Math-7B-Instruct,linearalgebra_transformations_m3,linear algebra,linear transformations,A,1.0,1.0,A,0.6,A,0.95,A,0.95,A
Qwen2.5-Math-7B-Instruct,linearalgebra_transformations_h1,linear algebra,linear transformations,Tie,0.5,0.5,B,0.85,B,0.95,,,A
Qwen2.5-Math-7B-Instruct,linearalgebra_transformations_h2,linear algebra,linear transformations,A,1.0,0.9,A,0.85,A,0.85,A,0.8,B
Qwen2.5-Math-7B-Instruct,linearalgebra_transformations_h3,linear algebra,linear transformations,A,1.0,0.6,B,0.85,A,0.98,A,0.95,B
Llama-3.1-8B-Instruct,arithmetic_basic_operations_e1,arithmetic,basic operations,A,1.0,0.95,A,0.9,A,0.98,A,1.0,A
Llama-3.1-8B-Instruct,arithmetic_basic_operations_e2,arithmetic,basic operations,A,1.0,0.8,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,arithmetic_basic_operations_e3,arithmetic,basic operations,B,1.0,0.8,B,0.95,B,0.95,B,0.9,B
Llama-3.1-8B-Instruct,arithmetic_basic_operations_m1,arithmetic,basic operations,B,1.0,0.8,B,0.95,B,0.9,B,1.0,A
Llama-3.1-8B-Instruct,arithmetic_basic_operations_m2,arithmetic,basic operations,A,0.0,0.9,B,0.85,B,0.9,A,0.9,B
Llama-3.1-8B-Instruct,arithmetic_basic_operations_m3,arithmetic,basic operations,B,1.0,0.8,B,0.95,B,0.95,B,0.95,A
Llama-3.1-8B-Instruct,arithmetic_basic_operations_h1,arithmetic,basic operations,A,0.0,0.9,B,0.65,B,0.85,B,0.9,B
Llama-3.1-8B-Instruct,arithmetic_basic_operations_h2,arithmetic,basic operations,A,1.0,0.85,A,0.85,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,arithmetic_basic_operations_h3,arithmetic,basic operations,B,1.0,0.8,B,0.85,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,arithmetic_fractions_e1,arithmetic,fractions,B,0.0,0.85,A,0.85,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,arithmetic_fractions_e2,arithmetic,fractions,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,arithmetic_fractions_e3,arithmetic,fractions,B,0.0,0.95,B,0.9,A,0.9,A,0.95,A
Llama-3.1-8B-Instruct,arithmetic_fractions_m1,arithmetic,fractions,B,1.0,0.9,B,0.9,B,0.98,B,0.95,B
Llama-3.1-8B-Instruct,arithmetic_fractions_m2,arithmetic,fractions,B,1.0,0.85,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,arithmetic_fractions_m3,arithmetic,fractions,B,0.0,0.9,A,0.85,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,arithmetic_fractions_h1,arithmetic,fractions,A,0.0,0.85,B,1.0,B,0.95,B,1.0,A
Llama-3.1-8B-Instruct,arithmetic_fractions_h2,arithmetic,fractions,A,0.0,0.95,B,0.95,B,0.9,B,1.0,A
Llama-3.1-8B-Instruct,arithmetic_fractions_h3,arithmetic,fractions,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,arithmetic_percentages_e1,arithmetic,percentages,B,1.0,0.8,B,1.0,B,0.95,B,1.0,A
Llama-3.1-8B-Instruct,arithmetic_percentages_e2,arithmetic,percentages,A,1.0,0.9,A,0.95,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,arithmetic_percentages_e3,arithmetic,percentages,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,arithmetic_percentages_m1,arithmetic,percentages,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,arithmetic_percentages_m2,arithmetic,percentages,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,arithmetic_percentages_m3,arithmetic,percentages,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,arithmetic_percentages_h1,arithmetic,percentages,A,1.0,0.8,A,0.95,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,arithmetic_percentages_h2,arithmetic,percentages,B,1.0,0.9,B,0.98,B,0.98,A,0.7,A
Llama-3.1-8B-Instruct,arithmetic_percentages_h3,arithmetic,percentages,A,0.0,0.85,B,0.95,B,0.9,B,1.0,A
Llama-3.1-8B-Instruct,arithmetic_numerical_e1,arithmetic,numerical approximation,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,arithmetic_numerical_e2,arithmetic,numerical approximation,A,0.0,0.9,B,0.9,A,0.95,B,1.0,A
Llama-3.1-8B-Instruct,arithmetic_numerical_e3,arithmetic,numerical approximation,B,1.0,0.8,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,arithmetic_numerical_m1,arithmetic,numerical approximation,A,1.0,0.8,A,0.65,B,0.85,A,0.8,A
Llama-3.1-8B-Instruct,arithmetic_numerical_m2,arithmetic,numerical approximation,A,0.0,0.9,B,0.95,B,0.95,B,0.95,A
Llama-3.1-8B-Instruct,arithmetic_numerical_m3,arithmetic,numerical approximation,A,1.0,0.9,A,0.95,A,0.95,A,0.9,A
Llama-3.1-8B-Instruct,arithmetic_numerical_h1,arithmetic,numerical approximation,B,0.0,0.8,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,arithmetic_numerical_h2,arithmetic,numerical approximation,A,0.0,0.9,B,0.8,B,0.92,B,0.9,B
Llama-3.1-8B-Instruct,arithmetic_numerical_h3,arithmetic,numerical approximation,A,1.0,0.8,A,0.95,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,arithmetic_order_e1,arithmetic,order of operations,A,0.0,0.95,B,1.0,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,arithmetic_order_e2,arithmetic,order of operations,A,1.0,0.85,A,1.0,A,1.0,A,1.0,A
Llama-3.1-8B-Instruct,arithmetic_order_e3,arithmetic,order of operations,A,1.0,0.9,A,0.98,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,arithmetic_order_m1,arithmetic,order of operations,B,1.0,1.0,B,1.0,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,arithmetic_order_m2,arithmetic,order of operations,A,1.0,0.9,A,1.0,A,1.0,A,1.0,A
Llama-3.1-8B-Instruct,arithmetic_order_m3,arithmetic,order of operations,B,1.0,0.9,B,0.85,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,arithmetic_order_h1,arithmetic,order of operations,A,0.0,0.9,B,1.0,B,1.0,B,1.0,A
Llama-3.1-8B-Instruct,arithmetic_order_h2,arithmetic,order of operations,B,1.0,0.9,B,0.95,B,0.95,A,0.95,B
Llama-3.1-8B-Instruct,arithmetic_order_h3,arithmetic,order of operations,A,1.0,0.85,A,0.85,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,algebra_equations_e1,algebra,equations,B,1.0,0.85,B,1.0,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,algebra_equations_e2,algebra,equations,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,algebra_equations_e3,algebra,equations,A,1.0,0.9,A,0.98,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,algebra_equations_m1,algebra,equations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,algebra_equations_m2,algebra,equations,B,1.0,0.9,B,0.9,A,0.95,B,0.95,A
Llama-3.1-8B-Instruct,algebra_equations_m3,algebra,equations,A,1.0,0.9,A,1.0,A,0.98,A,0.95,A
Llama-3.1-8B-Instruct,algebra_equations_h1,algebra,equations,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,algebra_equations_h2,algebra,equations,A,1.0,0.9,A,0.8,A,0.85,A,0.7,A
Llama-3.1-8B-Instruct,algebra_equations_h3,algebra,equations,B,0.0,0.95,A,0.75,B,0.7,A,0.8,B
Llama-3.1-8B-Instruct,algebra_inequalities_e1,algebra,inequalities,A,0.0,0.9,B,1.0,B,0.98,B,1.0,A
Llama-3.1-8B-Instruct,algebra_inequalities_e2,algebra,inequalities,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,algebra_inequalities_e3,algebra,inequalities,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,algebra_inequalities_m1,algebra,inequalities,B,0.0,0.85,A,0.95,A,0.95,A,0.95,B
Llama-3.1-8B-Instruct,algebra_inequalities_m2,algebra,inequalities,A,1.0,0.9,A,0.95,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,algebra_inequalities_m3,algebra,inequalities,A,0.0,0.9,B,0.92,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,algebra_inequalities_h1,algebra,inequalities,A,0.0,0.9,B,0.9,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,algebra_inequalities_h2,algebra,inequalities,B,1.0,0.9,B,0.85,B,0.95,B,0.7,B
Llama-3.1-8B-Instruct,algebra_inequalities_h3,algebra,inequalities,A,1.0,0.85,B,0.85,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,algebra_polynomials_e1,algebra,polynomials,A,1.0,0.8,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,algebra_polynomials_e2,algebra,polynomials,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,algebra_polynomials_e3,algebra,polynomials,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,algebra_polynomials_m1,algebra,polynomials,B,0.0,0.9,A,1.0,A,0.95,A,0.9,A
Llama-3.1-8B-Instruct,algebra_polynomials_m2,algebra,polynomials,B,1.0,0.85,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,algebra_polynomials_m3,algebra,polynomials,A,0.0,0.95,B,0.85,B,0.9,B,0.9,B
Llama-3.1-8B-Instruct,algebra_polynomials_h1,algebra,polynomials,A,0.0,0.9,B,0.95,B,0.95,B,0.95,A
Llama-3.1-8B-Instruct,algebra_polynomials_h2,algebra,polynomials,B,1.0,0.95,A,0.6,B,0.7,B,0.7,A
Llama-3.1-8B-Instruct,algebra_polynomials_h3,algebra,polynomials,B,1.0,0.8,B,0.85,A,0.7,B,0.7,A
Llama-3.1-8B-Instruct,algebra_functions_e1,algebra,functions,B,1.0,0.95,B,1.0,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,algebra_functions_e2,algebra,functions,A,1.0,0.9,A,0.95,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,algebra_functions_e3,algebra,functions,B,0.0,1.0,A,1.0,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,algebra_functions_m1,algebra,functions,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,algebra_functions_m2,algebra,functions,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,algebra_functions_m3,algebra,functions,A,0.0,0.95,A,0.85,B,0.9,B,0.95,B
Llama-3.1-8B-Instruct,algebra_functions_h1,algebra,functions,A,0.0,0.95,B,1.0,A,0.95,B,1.0,A
Llama-3.1-8B-Instruct,algebra_functions_h2,algebra,functions,A,0.0,0.9,B,0.75,B,0.85,A,0.9,A
Llama-3.1-8B-Instruct,algebra_functions_h3,algebra,functions,B,0.0,0.8,A,1.0,A,0.98,A,0.95,A
Llama-3.1-8B-Instruct,algebra_systems_e1,algebra,systems of equations,A,1.0,1.0,A,1.0,A,0.98,A,1.0,A
Llama-3.1-8B-Instruct,algebra_systems_e2,algebra,systems of equations,B,1.0,0.95,B,1.0,B,1.0,B,1.0,B
Llama-3.1-8B-Instruct,algebra_systems_e3,algebra,systems of equations,A,1.0,0.9,A,1.0,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,algebra_systems_m1,algebra,systems of equations,A,1.0,0.95,A,0.85,A,0.9,A,0.8,A
Llama-3.1-8B-Instruct,algebra_systems_m2,algebra,systems of equations,A,0.0,0.9,B,0.85,B,0.95,A,0.95,B
Llama-3.1-8B-Instruct,algebra_systems_m3,algebra,systems of equations,A,1.0,0.9,A,0.85,A,1.0,A,1.0,B
Llama-3.1-8B-Instruct,algebra_systems_h1,algebra,systems of equations,A,0.0,0.8,A,0.85,B,0.92,B,0.95,A
Llama-3.1-8B-Instruct,algebra_systems_h2,algebra,systems of equations,A,0.0,0.8,B,0.95,B,0.9,B,0.8,A
Llama-3.1-8B-Instruct,algebra_systems_h3,algebra,systems of equations,A,1.0,0.9,A,1.0,A,0.65,A,1.0,B
Llama-3.1-8B-Instruct,calculus_differentiation_e1,calculus,differentiation,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
Llama-3.1-8B-Instruct,calculus_differentiation_e2,calculus,differentiation,B,1.0,0.95,B,0.9,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,calculus_differentiation_e3,calculus,differentiation,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,calculus_differentiation_m1,calculus,differentiation,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,calculus_differentiation_m2,calculus,differentiation,B,0.0,0.9,A,0.95,A,0.95,A,0.95,B
Llama-3.1-8B-Instruct,calculus_differentiation_m3,calculus,differentiation,A,1.0,0.7,A,0.85,A,0.9,A,0.7,A
Llama-3.1-8B-Instruct,calculus_differentiation_h1,calculus,differentiation,B,0.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,calculus_differentiation_h2,calculus,differentiation,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,calculus_differentiation_h3,calculus,differentiation,A,0.0,0.9,B,0.85,B,0.9,B,0.7,B
Llama-3.1-8B-Instruct,calculus_integration_e1,calculus,integration,B,1.0,0.9,B,0.95,B,0.9,B,0.9,B
Llama-3.1-8B-Instruct,calculus_integration_e2,calculus,integration,B,1.0,0.95,B,0.65,B,0.85,,,B
Llama-3.1-8B-Instruct,calculus_integration_e3,calculus,integration,A,1.0,0.9,A,0.98,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,calculus_integration_m1,calculus,integration,A,1.0,0.95,A,1.0,A,0.98,A,1.0,A
Llama-3.1-8B-Instruct,calculus_integration_m2,calculus,integration,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,calculus_integration_m3,calculus,integration,B,0.0,0.9,A,1.0,A,1.0,A,1.0,A
Llama-3.1-8B-Instruct,calculus_integration_h1,calculus,integration,B,1.0,0.8,B,0.75,B,0.85,B,0.6,A
Llama-3.1-8B-Instruct,calculus_integration_h2,calculus,integration,A,0.0,0.8,B,0.95,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,calculus_integration_h3,calculus,integration,B,0.0,0.95,A,0.7,A,0.85,A,0.6,A
Llama-3.1-8B-Instruct,calculus_limits_e1,calculus,limits,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,calculus_limits_e2,calculus,limits,B,1.0,0.9,B,1.0,B,1.0,B,1.0,B
Llama-3.1-8B-Instruct,calculus_limits_e3,calculus,limits,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,calculus_limits_m1,calculus,limits,A,0.0,0.95,B,0.98,B,0.98,B,0.95,B
Llama-3.1-8B-Instruct,calculus_limits_m2,calculus,limits,B,0.0,0.8,A,0.95,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,calculus_limits_m3,calculus,limits,B,1.0,0.9,B,0.98,B,0.98,B,1.0,B
Llama-3.1-8B-Instruct,calculus_limits_h1,calculus,limits,A,1.0,0.8,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,calculus_limits_h2,calculus,limits,A,0.0,0.6,B,0.9,B,0.95,B,0.95,A
Llama-3.1-8B-Instruct,calculus_limits_h3,calculus,limits,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,calculus_series_e1,calculus,series,A,1.0,0.9,B,0.85,A,0.95,A,0.95,B
Llama-3.1-8B-Instruct,calculus_series_e2,calculus,series,B,1.0,0.8,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,calculus_series_e3,calculus,series,B,1.0,0.9,B,0.95,B,0.95,B,0.95,A
Llama-3.1-8B-Instruct,calculus_series_m1,calculus,series,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,calculus_series_m2,calculus,series,A,0.0,0.9,B,0.95,B,0.85,B,0.95,A
Llama-3.1-8B-Instruct,calculus_series_m3,calculus,series,A,0.0,0.9,B,0.85,B,0.85,B,0.7,B
Llama-3.1-8B-Instruct,calculus_series_h1,calculus,series,A,0.0,0.9,B,1.0,B,0.98,B,0.95,A
Llama-3.1-8B-Instruct,calculus_series_h2,calculus,series,A,1.0,0.9,A,0.85,A,0.98,A,0.9,A
Llama-3.1-8B-Instruct,calculus_series_h3,calculus,series,A,1.0,0.9,A,0.85,A,0.95,A,0.95,B
Llama-3.1-8B-Instruct,calculus_applications_e1,calculus,applications,B,1.0,0.9,B,1.0,B,0.98,B,1.0,B
Llama-3.1-8B-Instruct,calculus_applications_e2,calculus,applications,B,1.0,1.0,B,1.0,B,1.0,B,1.0,B
Llama-3.1-8B-Instruct,calculus_applications_e3,calculus,applications,B,0.0,1.0,A,0.85,B,0.75,A,0.95,B
Llama-3.1-8B-Instruct,calculus_applications_m1,calculus,applications,B,0.0,0.85,A,0.65,B,0.95,A,0.95,A
Llama-3.1-8B-Instruct,calculus_applications_m2,calculus,applications,A,1.0,0.95,A,1.0,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,calculus_applications_m3,calculus,applications,A,0.0,0.9,B,0.95,B,0.99,B,1.0,A
Llama-3.1-8B-Instruct,calculus_applications_h1,calculus,applications,A,0.0,0.9,B,0.85,B,1.0,B,0.7,B
Llama-3.1-8B-Instruct,calculus_applications_h2,calculus,applications,B,0.0,0.95,A,1.0,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,calculus_applications_h3,calculus,applications,A,1.0,0.95,A,1.0,A,0.98,A,1.0,A
Llama-3.1-8B-Instruct,geometry_plane_e1,geometry,plane geometry,A,1.0,0.95,A,1.0,A,1.0,A,1.0,A
Llama-3.1-8B-Instruct,geometry_plane_e2,geometry,plane geometry,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,geometry_plane_e3,geometry,plane geometry,A,1.0,1.0,A,1.0,A,0.98,A,1.0,A
Llama-3.1-8B-Instruct,geometry_plane_m1,geometry,plane geometry,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
Llama-3.1-8B-Instruct,geometry_plane_m2,geometry,plane geometry,B,1.0,0.9,B,0.95,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,geometry_plane_m3,geometry,plane geometry,A,0.0,0.9,B,0.85,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,geometry_plane_h1,geometry,plane geometry,A,0.0,0.9,B,0.75,B,0.85,A,0.7,B
Llama-3.1-8B-Instruct,geometry_plane_h2,geometry,plane geometry,B,1.0,0.85,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,geometry_plane_h3,geometry,plane geometry,A,1.0,0.9,B,0.95,A,0.9,A,0.9,A
Llama-3.1-8B-Instruct,geometry_coordinate_e1,geometry,coordinate geometry,B,1.0,0.9,B,0.98,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,geometry_coordinate_e2,geometry,coordinate geometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,geometry_coordinate_e3,geometry,coordinate geometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,geometry_coordinate_m1,geometry,coordinate geometry,A,0.0,0.8,B,1.0,B,0.85,B,1.0,B
Llama-3.1-8B-Instruct,geometry_coordinate_m2,geometry,coordinate geometry,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,geometry_coordinate_m3,geometry,coordinate geometry,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,geometry_coordinate_h1,geometry,coordinate geometry,B,1.0,0.9,B,0.95,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,geometry_coordinate_h2,geometry,coordinate geometry,A,0.0,0.9,B,0.85,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,geometry_coordinate_h3,geometry,coordinate geometry,B,1.0,0.95,B,0.85,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,geometry_transformations_e1,geometry,transformations,B,0.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,geometry_transformations_e2,geometry,transformations,A,1.0,0.8,A,0.85,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,geometry_transformations_e3,geometry,transformations,A,1.0,0.85,A,0.95,A,0.95,B,0.95,A
Llama-3.1-8B-Instruct,geometry_transformations_m1,geometry,transformations,A,1.0,0.9,A,1.0,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,geometry_transformations_m2,geometry,transformations,B,1.0,0.9,B,1.0,B,0.95,B,1.0,A
Llama-3.1-8B-Instruct,geometry_transformations_m3,geometry,transformations,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,geometry_transformations_h1,geometry,transformations,A,1.0,0.9,A,0.95,A,0.9,A,0.9,B
Llama-3.1-8B-Instruct,geometry_transformations_h2,geometry,transformations,B,0.0,0.95,A,0.85,A,0.9,A,0.9,B
Llama-3.1-8B-Instruct,geometry_transformations_h3,geometry,transformations,A,0.0,0.8,B,0.85,B,0.6,B,0.8,B
Llama-3.1-8B-Instruct,geometry_mensuration_e1,geometry,mensuration,A,1.0,0.85,A,1.0,A,0.98,A,0.95,A
Llama-3.1-8B-Instruct,geometry_mensuration_e2,geometry,mensuration,A,1.0,0.85,A,1.0,A,0.99,A,1.0,A
Llama-3.1-8B-Instruct,geometry_mensuration_e3,geometry,mensuration,A,0.0,0.8,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,geometry_mensuration_m1,geometry,mensuration,A,1.0,0.9,A,0.85,A,0.85,A,1.0,A
Llama-3.1-8B-Instruct,geometry_mensuration_m2,geometry,mensuration,B,1.0,0.9,B,1.0,B,1.0,B,1.0,B
Llama-3.1-8B-Instruct,geometry_mensuration_m3,geometry,mensuration,A,0.0,0.9,B,0.85,B,0.85,A,0.95,B
Llama-3.1-8B-Instruct,geometry_mensuration_h1,geometry,mensuration,A,0.0,0.9,B,0.8,B,0.85,A,0.65,B
Llama-3.1-8B-Instruct,geometry_mensuration_h2,geometry,mensuration,A,0.0,1.0,B,0.7,B,0.85,,,B
Llama-3.1-8B-Instruct,geometry_mensuration_h3,geometry,mensuration,B,1.0,0.8,B,0.85,B,0.85,B,0.7,B
Llama-3.1-8B-Instruct,geometry_trigonometry_e1,geometry,trigonometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,geometry_trigonometry_e2,geometry,trigonometry,B,1.0,0.9,B,0.85,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,geometry_trigonometry_e3,geometry,trigonometry,B,0.0,0.8,B,0.65,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,geometry_trigonometry_m1,geometry,trigonometry,B,0.0,0.9,A,0.9,A,0.85,A,0.8,A
Llama-3.1-8B-Instruct,geometry_trigonometry_m2,geometry,trigonometry,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,geometry_trigonometry_m3,geometry,trigonometry,A,0.0,0.95,B,0.95,B,0.85,B,0.95,B
Llama-3.1-8B-Instruct,geometry_trigonometry_h1,geometry,trigonometry,A,1.0,0.9,A,1.0,A,0.98,A,1.0,B
Llama-3.1-8B-Instruct,geometry_trigonometry_h2,geometry,trigonometry,B,1.0,0.6,B,0.75,B,0.75,B,0.7,A
Llama-3.1-8B-Instruct,geometry_trigonometry_h3,geometry,trigonometry,B,1.0,0.9,B,0.99,B,0.98,B,0.95,B
Llama-3.1-8B-Instruct,numbertheory_divisibility_e1,number theory,divisibility,B,1.0,0.8,B,1.0,B,0.99,B,1.0,B
Llama-3.1-8B-Instruct,numbertheory_divisibility_e2,number theory,divisibility,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,numbertheory_divisibility_e3,number theory,divisibility,B,1.0,0.85,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,numbertheory_divisibility_m1,number theory,divisibility,B,1.0,0.9,B,0.75,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,numbertheory_divisibility_m2,number theory,divisibility,A,0.0,0.9,B,1.0,B,1.0,B,1.0,B
Llama-3.1-8B-Instruct,numbertheory_divisibility_m3,number theory,divisibility,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,numbertheory_divisibility_h1,number theory,divisibility,A,1.0,0.9,A,0.95,B,0.85,A,1.0,B
Llama-3.1-8B-Instruct,numbertheory_divisibility_h2,number theory,divisibility,B,1.0,0.8,B,0.95,B,0.95,B,0.9,B
Llama-3.1-8B-Instruct,numbertheory_divisibility_h3,number theory,divisibility,A,1.0,0.9,A,0.9,A,0.9,A,0.8,A
Llama-3.1-8B-Instruct,numbertheory_modular_e1,number theory,modular arithmetic,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,numbertheory_modular_e2,number theory,modular arithmetic,A,1.0,0.75,A,0.98,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,numbertheory_modular_e3,number theory,modular arithmetic,A,1.0,0.8,A,0.95,A,0.95,B,0.95,A
Llama-3.1-8B-Instruct,numbertheory_modular_m1,number theory,modular arithmetic,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,numbertheory_modular_m2,number theory,modular arithmetic,A,1.0,0.85,B,0.9,A,0.95,A,0.95,B
Llama-3.1-8B-Instruct,numbertheory_modular_m3,number theory,modular arithmetic,A,0.0,1.0,B,0.95,A,0.95,B,0.95,B
Llama-3.1-8B-Instruct,numbertheory_modular_h1,number theory,modular arithmetic,A,1.0,0.8,B,0.85,A,0.85,A,0.8,B
Llama-3.1-8B-Instruct,numbertheory_modular_h2,number theory,modular arithmetic,A,1.0,0.85,A,0.85,A,0.85,B,0.8,A
Llama-3.1-8B-Instruct,numbertheory_modular_h3,number theory,modular arithmetic,A,1.0,0.8,A,0.85,B,0.95,A,0.7,B
Llama-3.1-8B-Instruct,numbertheory_primes_e1,number theory,primes,A,0.0,0.9,B,0.95,B,0.9,B,0.95,B
Llama-3.1-8B-Instruct,numbertheory_primes_e2,number theory,primes,B,0.0,0.8,A,0.98,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,numbertheory_primes_e3,number theory,primes,A,1.0,0.9,A,1.0,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,numbertheory_primes_m1,number theory,primes,B,0.0,0.9,A,0.95,A,0.85,A,0.95,A
Llama-3.1-8B-Instruct,numbertheory_primes_m2,number theory,primes,A,0.0,0.8,B,0.9,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,numbertheory_primes_m3,number theory,primes,B,1.0,0.8,B,1.0,B,1.0,B,1.0,B
Llama-3.1-8B-Instruct,numbertheory_primes_h1,number theory,primes,A,1.0,0.9,B,0.65,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,numbertheory_primes_h2,number theory,primes,B,1.0,0.8,B,1.0,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,numbertheory_primes_h3,number theory,primes,A,1.0,0.9,B,0.75,A,0.95,A,0.95,B
Llama-3.1-8B-Instruct,numbertheory_diophantine_e1,number theory,diophantine equations,B,1.0,0.9,B,0.6,B,0.7,A,0.7,B
Llama-3.1-8B-Instruct,numbertheory_diophantine_e2,number theory,diophantine equations,A,0.0,0.9,B,0.9,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,numbertheory_diophantine_e3,number theory,diophantine equations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Llama-3.1-8B-Instruct,numbertheory_diophantine_m1,number theory,diophantine equations,A,1.0,0.95,A,0.95,A,0.95,A,1.0,B
Llama-3.1-8B-Instruct,numbertheory_diophantine_m2,number theory,diophantine equations,B,1.0,0.95,B,1.0,B,0.95,B,0.95,A
Llama-3.1-8B-Instruct,numbertheory_diophantine_m3,number theory,diophantine equations,A,1.0,0.8,A,0.95,A,0.65,A,0.7,B
Llama-3.1-8B-Instruct,numbertheory_diophantine_h1,number theory,diophantine equations,B,0.0,0.9,A,0.7,B,0.85,A,0.7,A
Llama-3.1-8B-Instruct,numbertheory_diophantine_h2,number theory,diophantine equations,B,1.0,0.9,B,0.75,B,0.9,A,0.6,A
Llama-3.1-8B-Instruct,numbertheory_diophantine_h3,number theory,diophantine equations,B,0.0,0.9,A,0.9,A,0.95,A,0.6,A
Llama-3.1-8B-Instruct,numbertheory_sequences_e1,number theory,number sequences,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,numbertheory_sequences_e2,number theory,number sequences,A,0.0,0.9,B,0.95,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,numbertheory_sequences_e3,number theory,number sequences,B,1.0,0.9,B,0.95,B,0.99,B,0.9,B
Llama-3.1-8B-Instruct,numbertheory_sequences_m1,number theory,number sequences,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,numbertheory_sequences_m2,number theory,number sequences,B,1.0,0.85,B,0.75,A,0.5,B,0.7,A
Llama-3.1-8B-Instruct,numbertheory_sequences_m3,number theory,number sequences,A,0.0,0.85,B,0.9,A,0.95,B,0.95,B
Llama-3.1-8B-Instruct,numbertheory_sequences_h1,number theory,number sequences,A,1.0,0.9,A,1.0,A,0.99,A,0.95,B
Llama-3.1-8B-Instruct,numbertheory_sequences_h2,number theory,number sequences,A,1.0,0.95,A,0.65,A,0.85,A,0.7,B
Llama-3.1-8B-Instruct,numbertheory_sequences_h3,number theory,number sequences,B,0.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,combinatorics_counting_e1,combinatorics,counting principles,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,combinatorics_counting_e2,combinatorics,counting principles,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,combinatorics_counting_e3,combinatorics,counting principles,A,0.0,0.9,B,0.85,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,combinatorics_counting_m1,combinatorics,counting principles,A,1.0,0.9,A,0.9,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,combinatorics_counting_m2,combinatorics,counting principles,A,0.0,0.9,A,0.85,B,0.9,B,0.8,B
Llama-3.1-8B-Instruct,combinatorics_counting_m3,combinatorics,counting principles,A,1.0,0.9,A,1.0,A,1.0,A,1.0,A
Llama-3.1-8B-Instruct,combinatorics_counting_h1,combinatorics,counting principles,B,0.0,0.8,B,0.75,A,0.5,A,0.6,A
Llama-3.1-8B-Instruct,combinatorics_counting_h2,combinatorics,counting principles,A,1.0,0.9,A,0.85,B,0.98,A,0.95,A
Llama-3.1-8B-Instruct,combinatorics_counting_h3,combinatorics,counting principles,A,0.0,0.95,B,0.65,B,0.95,B,0.65,B
Llama-3.1-8B-Instruct,combinatorics_permutations_e1,combinatorics,permutations,B,0.0,0.8,A,0.85,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,combinatorics_permutations_e2,combinatorics,permutations,A,0.0,0.9,B,0.9,A,0.95,B,0.95,B
Llama-3.1-8B-Instruct,combinatorics_permutations_e3,combinatorics,permutations,A,0.0,0.8,B,1.0,B,1.0,B,1.0,B
Llama-3.1-8B-Instruct,combinatorics_permutations_m1,combinatorics,permutations,B,1.0,0.95,B,0.95,B,0.98,B,0.95,B
Llama-3.1-8B-Instruct,combinatorics_permutations_m2,combinatorics,permutations,A,0.0,0.9,B,1.0,B,0.95,B,1.0,A
Llama-3.1-8B-Instruct,combinatorics_permutations_m3,combinatorics,permutations,A,0.0,1.0,A,0.75,B,0.9,B,1.0,A
Llama-3.1-8B-Instruct,combinatorics_permutations_h1,combinatorics,permutations,A,0.0,0.8,B,0.85,B,1.0,B,0.7,B
Llama-3.1-8B-Instruct,combinatorics_permutations_h2,combinatorics,permutations,A,0.0,0.9,B,0.75,B,0.85,B,0.7,B
Llama-3.1-8B-Instruct,combinatorics_permutations_h3,combinatorics,permutations,A,1.0,0.95,A,0.85,A,0.7,A,0.6,A
Llama-3.1-8B-Instruct,combinatorics_combinations_e1,combinatorics,combinations,A,0.0,0.9,B,1.0,B,1.0,B,1.0,B
Llama-3.1-8B-Instruct,combinatorics_combinations_e2,combinatorics,combinations,B,1.0,0.8,B,0.95,B,0.95,A,0.95,B
Llama-3.1-8B-Instruct,combinatorics_combinations_e3,combinatorics,combinations,A,0.0,0.9,B,0.95,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,combinatorics_combinations_m1,combinatorics,combinations,B,1.0,0.9,B,0.95,B,0.95,B,0.95,A
Llama-3.1-8B-Instruct,combinatorics_combinations_m2,combinatorics,combinations,A,1.0,0.9,A,1.0,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,combinatorics_combinations_m3,combinatorics,combinations,B,0.0,1.0,B,0.85,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,combinatorics_combinations_h1,combinatorics,combinations,B,0.0,0.95,A,0.75,A,0.6,A,0.7,A
Llama-3.1-8B-Instruct,combinatorics_combinations_h2,combinatorics,combinations,B,1.0,0.95,B,1.0,B,0.95,B,1.0,A
Llama-3.1-8B-Instruct,combinatorics_combinations_h3,combinatorics,combinations,A,1.0,0.8,A,1.0,A,1.0,A,0.9,A
Llama-3.1-8B-Instruct,combinatorics_probability_e1,combinatorics,probability,A,0.0,0.8,B,0.85,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,combinatorics_probability_e2,combinatorics,probability,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,combinatorics_probability_e3,combinatorics,probability,A,1.0,0.95,A,1.0,A,1.0,A,1.0,A
Llama-3.1-8B-Instruct,combinatorics_probability_m1,combinatorics,probability,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,combinatorics_probability_m2,combinatorics,probability,B,1.0,0.95,B,1.0,B,0.98,B,1.0,B
Llama-3.1-8B-Instruct,combinatorics_probability_m3,combinatorics,probability,A,1.0,0.8,A,0.85,A,0.9,A,0.95,B
Llama-3.1-8B-Instruct,combinatorics_probability_h1,combinatorics,probability,B,0.0,0.9,B,0.6,A,0.9,A,1.0,B
Llama-3.1-8B-Instruct,combinatorics_probability_h2,combinatorics,probability,B,1.0,0.9,B,0.85,B,0.85,,,B
Llama-3.1-8B-Instruct,combinatorics_probability_h3,combinatorics,probability,A,0.0,0.9,B,0.8,B,1.0,B,0.7,B
Llama-3.1-8B-Instruct,combinatorics_recursion_e1,combinatorics,recursion,B,1.0,0.9,B,0.98,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,combinatorics_recursion_e2,combinatorics,recursion,A,0.0,0.9,B,1.0,B,1.0,B,1.0,B
Llama-3.1-8B-Instruct,combinatorics_recursion_e3,combinatorics,recursion,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,combinatorics_recursion_m1,combinatorics,recursion,A,1.0,0.9,A,1.0,A,0.99,A,1.0,A
Llama-3.1-8B-Instruct,combinatorics_recursion_m2,combinatorics,recursion,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,combinatorics_recursion_m3,combinatorics,recursion,B,1.0,0.9,B,0.65,B,0.85,A,0.7,A
Llama-3.1-8B-Instruct,combinatorics_recursion_h1,combinatorics,recursion,B,1.0,0.8,B,1.0,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,combinatorics_recursion_h2,combinatorics,recursion,B,1.0,0.8,B,0.95,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,combinatorics_recursion_h3,combinatorics,recursion,A,0.0,0.95,B,0.65,B,0.95,B,0.6,B
Llama-3.1-8B-Instruct,statistics_descriptive_e1,statistics,descriptive statistics,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,statistics_descriptive_e2,statistics,descriptive statistics,A,1.0,0.9,A,0.95,A,0.95,B,0.95,A
Llama-3.1-8B-Instruct,statistics_descriptive_e3,statistics,descriptive statistics,A,1.0,0.85,A,0.95,A,0.95,A,0.8,A
Llama-3.1-8B-Instruct,statistics_descriptive_m1,statistics,descriptive statistics,A,1.0,0.9,A,0.85,A,0.95,A,0.8,A
Llama-3.1-8B-Instruct,statistics_descriptive_m2,statistics,descriptive statistics,A,1.0,0.95,A,1.0,A,0.98,A,1.0,A
Llama-3.1-8B-Instruct,statistics_descriptive_m3,statistics,descriptive statistics,A,0.0,0.9,B,0.9,B,0.85,B,0.7,B
Llama-3.1-8B-Instruct,statistics_descriptive_h1,statistics,descriptive statistics,A,1.0,0.9,A,0.95,A,0.95,A,0.9,A
Llama-3.1-8B-Instruct,statistics_descriptive_h2,statistics,descriptive statistics,A,1.0,0.9,A,0.95,A,0.85,A,0.7,A
Llama-3.1-8B-Instruct,statistics_descriptive_h3,statistics,descriptive statistics,B,1.0,0.9,B,0.85,B,0.95,,,B
Llama-3.1-8B-Instruct,statistics_distributions_e1,statistics,distributions,A,1.0,0.9,A,1.0,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,statistics_distributions_e2,statistics,distributions,A,1.0,0.9,A,1.0,A,0.98,A,1.0,A
Llama-3.1-8B-Instruct,statistics_distributions_e3,statistics,distributions,A,0.0,0.85,B,0.85,A,0.95,B,0.95,B
Llama-3.1-8B-Instruct,statistics_distributions_m1,statistics,distributions,B,1.0,1.0,B,1.0,B,1.0,B,1.0,B
Llama-3.1-8B-Instruct,statistics_distributions_m2,statistics,distributions,A,0.0,0.9,B,0.95,B,0.98,B,0.95,B
Llama-3.1-8B-Instruct,statistics_distributions_m3,statistics,distributions,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,statistics_distributions_h1,statistics,distributions,A,0.0,0.9,B,0.98,B,0.95,B,1.0,A
Llama-3.1-8B-Instruct,statistics_distributions_h2,statistics,distributions,A,1.0,0.9,A,1.0,A,0.98,A,1.0,A
Llama-3.1-8B-Instruct,statistics_distributions_h3,statistics,distributions,B,1.0,0.8,B,0.75,B,0.9,B,0.7,B
Llama-3.1-8B-Instruct,statistics_hypothesis_e1,statistics,hypothesis testing,A,0.0,0.9,B,0.9,B,0.9,A,0.95,B
Llama-3.1-8B-Instruct,statistics_hypothesis_e2,statistics,hypothesis testing,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,statistics_hypothesis_e3,statistics,hypothesis testing,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,statistics_hypothesis_m1,statistics,hypothesis testing,B,1.0,0.8,B,1.0,B,0.98,B,1.0,B
Llama-3.1-8B-Instruct,statistics_hypothesis_m2,statistics,hypothesis testing,A,0.0,0.85,B,0.95,B,0.95,B,0.85,B
Llama-3.1-8B-Instruct,statistics_hypothesis_m3,statistics,hypothesis testing,B,0.0,0.9,A,0.75,A,0.85,A,0.7,B
Llama-3.1-8B-Instruct,statistics_hypothesis_h1,statistics,hypothesis testing,B,0.0,0.9,A,0.85,A,0.85,A,0.6,A
Llama-3.1-8B-Instruct,statistics_hypothesis_h2,statistics,hypothesis testing,B,1.0,0.8,B,0.65,B,0.85,B,0.6,B
Llama-3.1-8B-Instruct,statistics_hypothesis_h3,statistics,hypothesis testing,A,1.0,0.9,A,0.98,A,0.98,A,1.0,A
Llama-3.1-8B-Instruct,statistics_regression_e1,statistics,regression,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,statistics_regression_e2,statistics,regression,A,1.0,0.8,A,0.98,A,1.0,A,1.0,A
Llama-3.1-8B-Instruct,statistics_regression_e3,statistics,regression,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,statistics_regression_m1,statistics,regression,A,1.0,0.95,A,0.95,A,0.98,A,1.0,A
Llama-3.1-8B-Instruct,statistics_regression_m2,statistics,regression,B,0.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,statistics_regression_m3,statistics,regression,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,statistics_regression_h1,statistics,regression,A,1.0,0.9,A,0.9,B,0.95,A,1.0,A
Llama-3.1-8B-Instruct,statistics_regression_h2,statistics,regression,A,1.0,0.95,A,0.95,A,0.95,B,0.95,A
Llama-3.1-8B-Instruct,statistics_regression_h3,statistics,regression,B,1.0,0.9,B,0.85,B,0.9,B,0.9,B
Llama-3.1-8B-Instruct,statistics_bayesian_e1,statistics,bayesian inference,A,1.0,0.8,A,1.0,A,0.98,A,1.0,A
Llama-3.1-8B-Instruct,statistics_bayesian_e2,statistics,bayesian inference,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
Llama-3.1-8B-Instruct,statistics_bayesian_e3,statistics,bayesian inference,A,1.0,0.8,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,statistics_bayesian_m1,statistics,bayesian inference,A,1.0,0.9,A,0.9,B,0.95,A,0.85,B
Llama-3.1-8B-Instruct,statistics_bayesian_m2,statistics,bayesian inference,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,statistics_bayesian_m3,statistics,bayesian inference,A,0.0,0.9,B,1.0,B,0.99,B,1.0,B
Llama-3.1-8B-Instruct,statistics_bayesian_h1,statistics,bayesian inference,A,1.0,0.9,A,0.85,A,0.85,A,0.7,A
Llama-3.1-8B-Instruct,statistics_bayesian_h2,statistics,bayesian inference,A,0.0,0.95,B,0.75,B,0.85,B,0.8,B
Llama-3.1-8B-Instruct,statistics_bayesian_h3,statistics,bayesian inference,A,1.0,0.9,A,0.9,A,0.85,A,0.8,B
Llama-3.1-8B-Instruct,linearalgebra_matrices_e1,linear algebra,matrices,B,1.0,0.8,B,0.85,B,0.95,B,0.95,B
Llama-3.1-8B-Instruct,linearalgebra_matrices_e2,linear algebra,matrices,B,1.0,1.0,B,1.0,B,0.98,B,0.95,B
Llama-3.1-8B-Instruct,linearalgebra_matrices_e3,linear algebra,matrices,B,1.0,0.9,B,0.98,B,0.95,B,0.95,A
Llama-3.1-8B-Instruct,linearalgebra_matrices_m1,linear algebra,matrices,A,1.0,0.9,A,0.98,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,linearalgebra_matrices_m2,linear algebra,matrices,A,0.0,0.85,B,0.85,B,0.85,B,0.9,A
Llama-3.1-8B-Instruct,linearalgebra_matrices_m3,linear algebra,matrices,A,0.0,0.9,B,0.75,B,0.85,B,0.95,B
Llama-3.1-8B-Instruct,linearalgebra_matrices_h1,linear algebra,matrices,A,0.0,0.95,B,0.95,B,0.95,B,0.9,A
Llama-3.1-8B-Instruct,linearalgebra_matrices_h2,linear algebra,matrices,B,1.0,0.9,B,0.85,B,0.95,,,B
Llama-3.1-8B-Instruct,linearalgebra_matrices_h3,linear algebra,matrices,A,0.0,0.8,A,0.8,B,0.9,B,0.7,A
Llama-3.1-8B-Instruct,linearalgebra_determinants_e1,linear algebra,determinants,A,1.0,1.0,A,0.85,A,0.85,A,0.9,A
Llama-3.1-8B-Instruct,linearalgebra_determinants_e2,linear algebra,determinants,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,linearalgebra_determinants_e3,linear algebra,determinants,A,0.0,0.8,A,0.85,B,0.95,B,0.95,A
Llama-3.1-8B-Instruct,linearalgebra_determinants_m1,linear algebra,determinants,B,1.0,0.8,B,0.75,B,0.8,B,0.7,B
Llama-3.1-8B-Instruct,linearalgebra_determinants_m2,linear algebra,determinants,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,linearalgebra_determinants_m3,linear algebra,determinants,A,0.0,0.95,B,0.65,A,0.95,B,0.95,A
Llama-3.1-8B-Instruct,linearalgebra_determinants_h1,linear algebra,determinants,B,1.0,0.9,B,0.85,B,0.9,A,0.8,B
Llama-3.1-8B-Instruct,linearalgebra_determinants_h2,linear algebra,determinants,B,0.0,0.85,A,0.98,A,0.95,A,0.9,A
Llama-3.1-8B-Instruct,linearalgebra_determinants_h3,linear algebra,determinants,B,1.0,0.9,B,1.0,B,0.95,B,1.0,A
Llama-3.1-8B-Instruct,linearalgebra_vectorspaces_e1,linear algebra,vector spaces,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Llama-3.1-8B-Instruct,linearalgebra_vectorspaces_e2,linear algebra,vector spaces,A,0.0,0.9,B,1.0,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,linearalgebra_vectorspaces_e3,linear algebra,vector spaces,B,1.0,0.9,B,0.95,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,linearalgebra_vectorspaces_m1,linear algebra,vector spaces,A,0.0,0.9,B,0.85,B,0.9,B,0.6,B
Llama-3.1-8B-Instruct,linearalgebra_vectorspaces_m2,linear algebra,vector spaces,A,0.0,0.9,B,0.95,B,0.95,B,0.9,B
Llama-3.1-8B-Instruct,linearalgebra_vectorspaces_m3,linear algebra,vector spaces,A,1.0,0.9,A,0.6,A,0.9,B,0.7,A
Llama-3.1-8B-Instruct,linearalgebra_vectorspaces_h1,linear algebra,vector spaces,B,1.0,0.95,B,0.7,B,0.9,B,0.95,B
Llama-3.1-8B-Instruct,linearalgebra_vectorspaces_h2,linear algebra,vector spaces,B,1.0,0.85,B,1.0,B,0.98,B,1.0,B
Llama-3.1-8B-Instruct,linearalgebra_vectorspaces_h3,linear algebra,vector spaces,B,1.0,0.9,B,0.8,B,0.7,A,0.6,A
Llama-3.1-8B-Instruct,linearalgebra_eigenvalues_e1,linear algebra,eigenvalues,A,0.0,0.95,B,0.95,B,0.95,B,1.0,B
Llama-3.1-8B-Instruct,linearalgebra_eigenvalues_e2,linear algebra,eigenvalues,A,1.0,0.8,A,0.95,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,linearalgebra_eigenvalues_e3,linear algebra,eigenvalues,A,1.0,0.85,A,1.0,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,linearalgebra_eigenvalues_m1,linear algebra,eigenvalues,B,1.0,0.9,B,0.95,B,0.95,B,0.95,A
Llama-3.1-8B-Instruct,linearalgebra_eigenvalues_m2,linear algebra,eigenvalues,A,1.0,0.95,A,0.95,A,0.85,A,0.95,A
Llama-3.1-8B-Instruct,linearalgebra_eigenvalues_m3,linear algebra,eigenvalues,A,0.0,0.9,B,0.9,A,0.95,B,1.0,B
Llama-3.1-8B-Instruct,linearalgebra_eigenvalues_h1,linear algebra,eigenvalues,A,0.0,0.9,B,0.95,B,0.95,B,0.9,B
Llama-3.1-8B-Instruct,linearalgebra_eigenvalues_h2,linear algebra,eigenvalues,B,1.0,0.9,B,1.0,B,0.95,B,0.95,A
Llama-3.1-8B-Instruct,linearalgebra_eigenvalues_h3,linear algebra,eigenvalues,B,0.0,0.9,A,0.95,A,0.9,A,0.95,B
Llama-3.1-8B-Instruct,linearalgebra_transformations_e1,linear algebra,linear transformations,A,1.0,0.8,A,0.85,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,linearalgebra_transformations_e2,linear algebra,linear transformations,A,1.0,1.0,A,0.95,A,0.9,A,0.95,B
Llama-3.1-8B-Instruct,linearalgebra_transformations_e3,linear algebra,linear transformations,A,1.0,0.9,A,0.95,A,0.95,A,1.0,A
Llama-3.1-8B-Instruct,linearalgebra_transformations_m1,linear algebra,linear transformations,A,1.0,0.9,A,0.95,A,0.9,A,0.7,A
Llama-3.1-8B-Instruct,linearalgebra_transformations_m2,linear algebra,linear transformations,B,1.0,0.95,B,0.95,B,0.98,B,0.9,A
Llama-3.1-8B-Instruct,linearalgebra_transformations_m3,linear algebra,linear transformations,B,0.0,0.95,A,0.95,A,0.95,B,0.95,A
Llama-3.1-8B-Instruct,linearalgebra_transformations_h1,linear algebra,linear transformations,B,1.0,0.9,B,0.7,B,0.9,A,0.7,B
Llama-3.1-8B-Instruct,linearalgebra_transformations_h2,linear algebra,linear transformations,B,1.0,0.8,B,0.75,B,0.95,B,0.6,A
Llama-3.1-8B-Instruct,linearalgebra_transformations_h3,linear algebra,linear transformations,A,1.0,0.9,A,1.0,A,0.98,A,0.9,A
OpenThinker2-7B,arithmetic_basic_operations_e1,arithmetic,basic operations,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_basic_operations_e2,arithmetic,basic operations,A,0.0,1.0,B,0.95,B,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_basic_operations_e3,arithmetic,basic operations,A,1.0,1.0,B,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_basic_operations_m1,arithmetic,basic operations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_basic_operations_m2,arithmetic,basic operations,A,1.0,1.0,A,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_basic_operations_m3,arithmetic,basic operations,A,1.0,1.0,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,arithmetic_basic_operations_h1,arithmetic,basic operations,B,0.0,0.95,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_basic_operations_h2,arithmetic,basic operations,A,1.0,0.95,B,0.85,A,0.98,A,0.9,B
OpenThinker2-7B,arithmetic_basic_operations_h3,arithmetic,basic operations,A,0.0,0.95,B,1.0,A,0.95,B,0.95,B
OpenThinker2-7B,arithmetic_fractions_e1,arithmetic,fractions,A,1.0,1.0,A,0.95,B,0.95,A,0.95,B
OpenThinker2-7B,arithmetic_fractions_e2,arithmetic,fractions,B,0.0,0.95,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_fractions_e3,arithmetic,fractions,A,1.0,0.95,A,0.9,B,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_fractions_m1,arithmetic,fractions,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_fractions_m2,arithmetic,fractions,A,0.0,1.0,B,0.95,B,0.95,B,0.95,A
OpenThinker2-7B,arithmetic_fractions_m3,arithmetic,fractions,B,0.0,0.98,B,0.95,A,0.92,A,0.95,A
OpenThinker2-7B,arithmetic_fractions_h1,arithmetic,fractions,A,1.0,1.0,A,0.95,A,0.95,A,1.0,B
OpenThinker2-7B,arithmetic_fractions_h2,arithmetic,fractions,B,0.0,0.95,A,0.95,B,0.95,A,0.95,B
OpenThinker2-7B,arithmetic_fractions_h3,arithmetic,fractions,A,1.0,1.0,B,0.95,A,0.95,A,1.0,A
OpenThinker2-7B,arithmetic_percentages_e1,arithmetic,percentages,A,1.0,0.99,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,arithmetic_percentages_e2,arithmetic,percentages,B,1.0,1.0,B,0.85,B,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_percentages_e3,arithmetic,percentages,A,1.0,1.0,B,0.95,A,0.92,A,0.95,A
OpenThinker2-7B,arithmetic_percentages_m1,arithmetic,percentages,B,0.0,0.98,A,0.85,A,0.9,,,A
OpenThinker2-7B,arithmetic_percentages_m2,arithmetic,percentages,B,0.0,1.0,A,0.85,A,0.95,B,0.95,B
OpenThinker2-7B,arithmetic_percentages_m3,arithmetic,percentages,B,1.0,1.0,B,0.92,A,0.95,B,0.95,A
OpenThinker2-7B,arithmetic_percentages_h1,arithmetic,percentages,B,0.0,1.0,B,0.85,A,0.95,A,0.95,B
OpenThinker2-7B,arithmetic_percentages_h2,arithmetic,percentages,A,1.0,0.85,A,1.0,A,0.95,A,1.0,A
OpenThinker2-7B,arithmetic_percentages_h3,arithmetic,percentages,A,1.0,0.95,A,0.85,A,0.95,B,0.95,A
OpenThinker2-7B,arithmetic_numerical_e1,arithmetic,numerical approximation,A,1.0,1.0,B,0.95,A,0.95,A,1.0,A
OpenThinker2-7B,arithmetic_numerical_e2,arithmetic,numerical approximation,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_numerical_e3,arithmetic,numerical approximation,A,1.0,0.99,A,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_numerical_m1,arithmetic,numerical approximation,B,0.0,0.95,A,0.95,A,0.92,A,0.95,A
OpenThinker2-7B,arithmetic_numerical_m2,arithmetic,numerical approximation,B,0.0,0.98,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_numerical_m3,arithmetic,numerical approximation,A,1.0,1.0,B,0.9,A,0.95,,,A
OpenThinker2-7B,arithmetic_numerical_h1,arithmetic,numerical approximation,A,1.0,0.95,A,1.0,A,0.95,A,0.95,B
OpenThinker2-7B,arithmetic_numerical_h2,arithmetic,numerical approximation,Tie,0.5,0.5,A,0.95,B,0.9,,,B
OpenThinker2-7B,arithmetic_numerical_h3,arithmetic,numerical approximation,A,1.0,1.0,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,arithmetic_order_e1,arithmetic,order of operations,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_order_e2,arithmetic,order of operations,A,1.0,0.95,A,0.95,A,0.98,A,0.95,B
OpenThinker2-7B,arithmetic_order_e3,arithmetic,order of operations,Tie,0.5,0.5,B,0.9,B,0.95,B,0.9,B
OpenThinker2-7B,arithmetic_order_m1,arithmetic,order of operations,A,1.0,0.98,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_order_m2,arithmetic,order of operations,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,arithmetic_order_m3,arithmetic,order of operations,B,0.0,1.0,A,0.95,A,0.95,A,1.0,B
OpenThinker2-7B,arithmetic_order_h1,arithmetic,order of operations,A,1.0,0.99,B,0.85,A,0.98,A,1.0,B
OpenThinker2-7B,arithmetic_order_h2,arithmetic,order of operations,A,1.0,1.0,A,0.95,A,0.98,A,1.0,B
OpenThinker2-7B,arithmetic_order_h3,arithmetic,order of operations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,algebra_equations_e1,algebra,equations,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
OpenThinker2-7B,algebra_equations_e2,algebra,equations,A,1.0,0.95,B,0.9,A,0.95,A,0.95,A
OpenThinker2-7B,algebra_equations_e3,algebra,equations,B,0.0,1.0,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,algebra_equations_m1,algebra,equations,Tie,0.5,0.5,A,0.95,A,0.98,B,0.95,B
OpenThinker2-7B,algebra_equations_m2,algebra,equations,A,1.0,0.95,B,0.95,A,0.95,A,1.0,A
OpenThinker2-7B,algebra_equations_m3,algebra,equations,B,0.0,0.99,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,algebra_equations_h1,algebra,equations,A,1.0,1.0,A,0.9,A,0.95,,,B
OpenThinker2-7B,algebra_equations_h2,algebra,equations,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,algebra_equations_h3,algebra,equations,B,1.0,0.95,B,0.9,B,0.95,B,0.95,A
OpenThinker2-7B,algebra_inequalities_e1,algebra,inequalities,A,1.0,1.0,A,0.95,A,0.95,B,0.9,A
OpenThinker2-7B,algebra_inequalities_e2,algebra,inequalities,Tie,0.5,0.5,A,0.95,A,0.95,A,1.0,B
OpenThinker2-7B,algebra_inequalities_e3,algebra,inequalities,A,0.0,0.95,B,0.95,B,0.95,A,0.95,A
OpenThinker2-7B,algebra_inequalities_m1,algebra,inequalities,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
OpenThinker2-7B,algebra_inequalities_m2,algebra,inequalities,B,0.0,0.5,A,0.9,A,0.98,A,0.95,B
OpenThinker2-7B,algebra_inequalities_m3,algebra,inequalities,B,0.0,1.0,A,0.95,B,0.95,A,0.95,B
OpenThinker2-7B,algebra_inequalities_h1,algebra,inequalities,Tie,0.5,0.5,A,0.85,A,0.98,A,0.95,B
OpenThinker2-7B,algebra_inequalities_h2,algebra,inequalities,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,algebra_inequalities_h3,algebra,inequalities,B,0.0,0.98,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,algebra_polynomials_e1,algebra,polynomials,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,algebra_polynomials_e2,algebra,polynomials,A,1.0,1.0,A,0.95,A,0.98,A,0.95,B
OpenThinker2-7B,algebra_polynomials_e3,algebra,polynomials,A,1.0,0.98,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,algebra_polynomials_m1,algebra,polynomials,A,1.0,1.0,A,0.55,A,0.98,A,1.0,B
OpenThinker2-7B,algebra_polynomials_m2,algebra,polynomials,A,1.0,1.0,B,0.95,A,0.95,A,1.0,A
OpenThinker2-7B,algebra_polynomials_m3,algebra,polynomials,A,1.0,1.0,A,0.95,A,0.95,,,B
OpenThinker2-7B,algebra_polynomials_h1,algebra,polynomials,A,1.0,1.0,A,0.95,B,0.95,,,B
OpenThinker2-7B,algebra_polynomials_h2,algebra,polynomials,A,1.0,1.0,A,0.9,A,0.98,A,0.95,A
OpenThinker2-7B,algebra_polynomials_h3,algebra,polynomials,A,0.0,0.95,B,0.95,B,0.85,A,0.95,A
OpenThinker2-7B,algebra_functions_e1,algebra,functions,A,1.0,1.0,A,0.95,A,0.98,A,1.0,B
OpenThinker2-7B,algebra_functions_e2,algebra,functions,A,1.0,0.95,B,0.8,A,0.95,A,0.95,A
OpenThinker2-7B,algebra_functions_e3,algebra,functions,B,0.0,1.0,A,0.85,B,0.95,A,0.95,A
OpenThinker2-7B,algebra_functions_m1,algebra,functions,A,1.0,1.0,A,0.95,A,0.95,,,B
OpenThinker2-7B,algebra_functions_m2,algebra,functions,B,0.0,1.0,A,0.95,A,0.98,A,0.95,B
OpenThinker2-7B,algebra_functions_m3,algebra,functions,A,1.0,0.98,A,0.9,A,0.95,A,0.95,A
OpenThinker2-7B,algebra_functions_h1,algebra,functions,A,0.0,0.99,B,0.95,B,0.95,B,0.95,A
OpenThinker2-7B,algebra_functions_h2,algebra,functions,B,1.0,0.95,B,0.95,B,0.98,A,0.95,A
OpenThinker2-7B,algebra_functions_h3,algebra,functions,A,1.0,0.95,B,0.85,A,0.92,A,0.9,B
OpenThinker2-7B,algebra_systems_e1,algebra,systems of equations,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,algebra_systems_e2,algebra,systems of equations,B,0.0,1.0,B,0.98,A,0.95,A,0.95,A
OpenThinker2-7B,algebra_systems_e3,algebra,systems of equations,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,algebra_systems_m1,algebra,systems of equations,A,0.0,1.0,B,0.9,B,0.95,A,0.95,B
OpenThinker2-7B,algebra_systems_m2,algebra,systems of equations,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,algebra_systems_m3,algebra,systems of equations,A,1.0,0.98,A,0.9,A,0.95,A,0.95,B
OpenThinker2-7B,algebra_systems_h1,algebra,systems of equations,B,0.0,1.0,A,0.95,A,0.95,B,0.95,B
OpenThinker2-7B,algebra_systems_h2,algebra,systems of equations,B,0.0,1.0,A,0.85,A,0.98,A,0.95,B
OpenThinker2-7B,algebra_systems_h3,algebra,systems of equations,A,0.0,0.9,B,0.95,B,0.95,A,0.95,A
OpenThinker2-7B,calculus_differentiation_e1,calculus,differentiation,A,0.0,1.0,B,0.95,B,0.95,A,0.95,A
OpenThinker2-7B,calculus_differentiation_e2,calculus,differentiation,A,0.0,0.95,B,0.98,B,0.95,B,0.95,A
OpenThinker2-7B,calculus_differentiation_e3,calculus,differentiation,A,1.0,0.99,B,0.9,A,0.95,A,0.95,A
OpenThinker2-7B,calculus_differentiation_m1,calculus,differentiation,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
OpenThinker2-7B,calculus_differentiation_m2,calculus,differentiation,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,calculus_differentiation_m3,calculus,differentiation,A,1.0,0.98,B,0.92,A,0.95,A,0.95,A
OpenThinker2-7B,calculus_differentiation_h1,calculus,differentiation,A,1.0,1.0,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,calculus_differentiation_h2,calculus,differentiation,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
OpenThinker2-7B,calculus_differentiation_h3,calculus,differentiation,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,calculus_integration_e1,calculus,integration,A,1.0,0.99,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,calculus_integration_e2,calculus,integration,A,1.0,1.0,A,0.95,A,0.95,A,1.0,B
OpenThinker2-7B,calculus_integration_e3,calculus,integration,A,1.0,0.98,B,0.95,A,0.95,A,1.0,A
OpenThinker2-7B,calculus_integration_m1,calculus,integration,A,1.0,1.0,A,0.85,A,0.95,A,1.0,A
OpenThinker2-7B,calculus_integration_m2,calculus,integration,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,calculus_integration_m3,calculus,integration,A,0.0,0.98,B,0.95,B,0.98,A,0.95,A
OpenThinker2-7B,calculus_integration_h1,calculus,integration,A,1.0,1.0,B,0.92,A,0.95,A,0.95,A
OpenThinker2-7B,calculus_integration_h2,calculus,integration,A,1.0,1.0,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,calculus_integration_h3,calculus,integration,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
OpenThinker2-7B,calculus_limits_e1,calculus,limits,A,1.0,1.0,A,0.9,B,0.95,A,0.95,B
OpenThinker2-7B,calculus_limits_e2,calculus,limits,B,0.0,0.95,B,0.9,A,0.95,A,0.95,A
OpenThinker2-7B,calculus_limits_e3,calculus,limits,A,1.0,1.0,A,0.95,A,0.98,A,0.95,B
OpenThinker2-7B,calculus_limits_m1,calculus,limits,B,0.0,1.0,A,0.85,B,0.98,A,0.95,A
OpenThinker2-7B,calculus_limits_m2,calculus,limits,A,1.0,0.99,A,0.95,A,0.98,A,1.0,B
OpenThinker2-7B,calculus_limits_m3,calculus,limits,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,calculus_limits_h1,calculus,limits,A,0.0,0.98,B,0.92,B,0.95,A,0.95,A
OpenThinker2-7B,calculus_limits_h2,calculus,limits,B,0.0,0.95,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,calculus_limits_h3,calculus,limits,B,0.0,1.0,B,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,calculus_series_e1,calculus,series,B,0.0,1.0,B,0.92,A,0.98,A,0.95,A
OpenThinker2-7B,calculus_series_e2,calculus,series,B,0.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,calculus_series_e3,calculus,series,B,0.0,0.98,A,0.95,A,0.95,A,1.0,B
OpenThinker2-7B,calculus_series_m1,calculus,series,Tie,0.5,0.5,B,0.85,A,0.95,A,1.0,A
OpenThinker2-7B,calculus_series_m2,calculus,series,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
OpenThinker2-7B,calculus_series_m3,calculus,series,A,1.0,1.0,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,calculus_series_h1,calculus,series,A,0.0,0.95,B,0.9,B,0.95,A,0.95,A
OpenThinker2-7B,calculus_series_h2,calculus,series,B,1.0,1.0,B,0.95,B,0.95,B,0.95,A
OpenThinker2-7B,calculus_series_h3,calculus,series,A,1.0,0.98,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,calculus_applications_e1,calculus,applications,A,1.0,1.0,A,0.95,A,0.95,,,B
OpenThinker2-7B,calculus_applications_e2,calculus,applications,B,0.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,calculus_applications_e3,calculus,applications,B,0.0,0.98,A,0.95,B,0.95,A,1.0,B
OpenThinker2-7B,calculus_applications_m1,calculus,applications,A,0.0,0.9,B,0.6,B,0.95,B,0.95,B
OpenThinker2-7B,calculus_applications_m2,calculus,applications,A,1.0,1.0,A,0.95,B,0.95,A,0.95,B
OpenThinker2-7B,calculus_applications_m3,calculus,applications,A,1.0,0.99,A,0.95,A,0.95,B,0.95,B
OpenThinker2-7B,calculus_applications_h1,calculus,applications,A,1.0,0.95,A,0.85,A,0.98,A,0.95,B
OpenThinker2-7B,calculus_applications_h2,calculus,applications,A,1.0,1.0,B,0.9,A,0.95,A,0.9,A
OpenThinker2-7B,calculus_applications_h3,calculus,applications,B,1.0,0.98,B,0.95,B,0.95,B,0.95,B
OpenThinker2-7B,geometry_plane_e1,geometry,plane geometry,B,0.0,0.95,B,0.9,A,0.95,A,0.95,A
OpenThinker2-7B,geometry_plane_e2,geometry,plane geometry,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,geometry_plane_e3,geometry,plane geometry,B,0.0,1.0,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,geometry_plane_m1,geometry,plane geometry,Tie,0.5,0.5,A,1.0,A,0.95,A,0.95,A
OpenThinker2-7B,geometry_plane_m2,geometry,plane geometry,A,0.0,1.0,B,0.85,B,0.95,A,0.95,B
OpenThinker2-7B,geometry_plane_m3,geometry,plane geometry,A,1.0,0.95,A,0.95,B,0.95,,,B
OpenThinker2-7B,geometry_plane_h1,geometry,plane geometry,A,1.0,0.98,B,0.85,A,0.92,A,0.95,A
OpenThinker2-7B,geometry_plane_h2,geometry,plane geometry,B,1.0,1.0,B,0.95,B,0.95,B,0.95,B
OpenThinker2-7B,geometry_plane_h3,geometry,plane geometry,B,0.0,1.0,A,0.95,B,0.95,A,0.95,B
OpenThinker2-7B,geometry_coordinate_e1,geometry,coordinate geometry,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,geometry_coordinate_e2,geometry,coordinate geometry,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,geometry_coordinate_e3,geometry,coordinate geometry,B,0.0,1.0,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,geometry_coordinate_m1,geometry,coordinate geometry,A,0.0,0.95,B,0.85,B,0.95,A,0.85,A
OpenThinker2-7B,geometry_coordinate_m2,geometry,coordinate geometry,A,1.0,1.0,A,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,geometry_coordinate_m3,geometry,coordinate geometry,A,1.0,1.0,A,0.85,B,0.95,A,0.95,B
OpenThinker2-7B,geometry_coordinate_h1,geometry,coordinate geometry,B,0.0,1.0,A,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,geometry_coordinate_h2,geometry,coordinate geometry,B,0.0,1.0,A,0.9,A,0.98,A,1.0,B
OpenThinker2-7B,geometry_coordinate_h3,geometry,coordinate geometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,geometry_transformations_e1,geometry,transformations,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
OpenThinker2-7B,geometry_transformations_e2,geometry,transformations,A,1.0,0.99,A,0.95,A,0.98,,,B
OpenThinker2-7B,geometry_transformations_e3,geometry,transformations,A,1.0,1.0,B,0.95,A,0.95,A,1.0,A
OpenThinker2-7B,geometry_transformations_m1,geometry,transformations,A,1.0,0.99,A,0.85,B,0.98,A,0.95,A
OpenThinker2-7B,geometry_transformations_m2,geometry,transformations,A,1.0,1.0,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,geometry_transformations_m3,geometry,transformations,A,0.0,1.0,B,0.85,B,0.95,A,0.9,A
OpenThinker2-7B,geometry_transformations_h1,geometry,transformations,B,0.0,1.0,B,0.6,A,0.98,A,0.95,A
OpenThinker2-7B,geometry_transformations_h2,geometry,transformations,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,geometry_transformations_h3,geometry,transformations,A,0.0,0.95,B,0.9,B,0.98,A,0.95,A
OpenThinker2-7B,geometry_mensuration_e1,geometry,mensuration,A,1.0,0.95,A,0.85,B,0.98,A,0.95,A
OpenThinker2-7B,geometry_mensuration_e2,geometry,mensuration,A,1.0,0.98,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,geometry_mensuration_e3,geometry,mensuration,A,1.0,1.0,B,0.85,A,0.95,A,0.95,B
OpenThinker2-7B,geometry_mensuration_m1,geometry,mensuration,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
OpenThinker2-7B,geometry_mensuration_m2,geometry,mensuration,B,0.0,1.0,A,0.95,B,0.95,A,0.95,B
OpenThinker2-7B,geometry_mensuration_m3,geometry,mensuration,A,1.0,0.98,A,0.85,A,0.95,A,1.0,A
OpenThinker2-7B,geometry_mensuration_h1,geometry,mensuration,B,1.0,1.0,B,0.9,B,0.95,B,0.95,B
OpenThinker2-7B,geometry_mensuration_h2,geometry,mensuration,B,0.0,1.0,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,geometry_mensuration_h3,geometry,mensuration,B,1.0,0.85,B,0.6,B,0.85,B,0.9,B
OpenThinker2-7B,geometry_trigonometry_e1,geometry,trigonometry,B,1.0,1.0,A,0.8,B,0.95,B,0.95,B
OpenThinker2-7B,geometry_trigonometry_e2,geometry,trigonometry,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,geometry_trigonometry_e3,geometry,trigonometry,A,0.0,1.0,A,0.95,B,0.9,B,0.95,B
OpenThinker2-7B,geometry_trigonometry_m1,geometry,trigonometry,B,0.0,1.0,B,0.85,A,0.95,A,0.95,B
OpenThinker2-7B,geometry_trigonometry_m2,geometry,trigonometry,A,1.0,0.98,A,0.95,A,0.98,A,0.95,B
OpenThinker2-7B,geometry_trigonometry_m3,geometry,trigonometry,A,1.0,0.9,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,geometry_trigonometry_h1,geometry,trigonometry,Tie,0.5,0.5,A,0.9,A,0.95,,,A
OpenThinker2-7B,geometry_trigonometry_h2,geometry,trigonometry,A,1.0,0.65,A,0.85,B,0.85,A,0.95,A
OpenThinker2-7B,geometry_trigonometry_h3,geometry,trigonometry,A,1.0,1.0,A,1.0,A,0.95,A,1.0,A
OpenThinker2-7B,numbertheory_divisibility_e1,number theory,divisibility,A,1.0,0.98,B,0.9,A,0.95,A,0.95,A
OpenThinker2-7B,numbertheory_divisibility_e2,number theory,divisibility,A,1.0,1.0,B,0.95,A,0.98,A,0.95,A
OpenThinker2-7B,numbertheory_divisibility_e3,number theory,divisibility,A,1.0,0.95,A,0.85,A,0.98,A,1.0,B
OpenThinker2-7B,numbertheory_divisibility_m1,number theory,divisibility,A,1.0,1.0,A,0.95,A,0.98,B,1.0,B
OpenThinker2-7B,numbertheory_divisibility_m2,number theory,divisibility,B,0.0,1.0,A,0.55,A,0.95,A,0.95,A
OpenThinker2-7B,numbertheory_divisibility_m3,number theory,divisibility,A,1.0,1.0,A,0.9,A,0.98,A,1.0,B
OpenThinker2-7B,numbertheory_divisibility_h1,number theory,divisibility,A,1.0,1.0,A,0.85,A,0.95,A,1.0,B
OpenThinker2-7B,numbertheory_divisibility_h2,number theory,divisibility,A,1.0,0.98,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,numbertheory_divisibility_h3,number theory,divisibility,A,1.0,1.0,A,0.85,A,0.95,A,0.95,B
OpenThinker2-7B,numbertheory_modular_e1,number theory,modular arithmetic,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,numbertheory_modular_e2,number theory,modular arithmetic,A,1.0,0.95,A,0.9,A,0.98,A,1.0,B
OpenThinker2-7B,numbertheory_modular_e3,number theory,modular arithmetic,A,1.0,1.0,A,0.9,B,0.95,A,0.95,A
OpenThinker2-7B,numbertheory_modular_m1,number theory,modular arithmetic,A,1.0,1.0,A,0.95,A,0.98,A,1.0,B
OpenThinker2-7B,numbertheory_modular_m2,number theory,modular arithmetic,A,1.0,1.0,A,0.85,A,0.95,,,A
OpenThinker2-7B,numbertheory_modular_m3,number theory,modular arithmetic,A,1.0,0.95,A,0.7,A,0.95,A,0.95,B
OpenThinker2-7B,numbertheory_modular_h1,number theory,modular arithmetic,B,1.0,1.0,A,0.95,B,0.98,,,B
OpenThinker2-7B,numbertheory_modular_h2,number theory,modular arithmetic,A,1.0,1.0,A,0.85,A,0.98,A,0.95,B
OpenThinker2-7B,numbertheory_modular_h3,number theory,modular arithmetic,A,1.0,1.0,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,numbertheory_primes_e1,number theory,primes,A,1.0,1.0,A,0.95,A,0.98,A,0.95,B
OpenThinker2-7B,numbertheory_primes_e2,number theory,primes,A,0.0,1.0,B,0.85,B,0.95,,,B
OpenThinker2-7B,numbertheory_primes_e3,number theory,primes,A,1.0,0.98,A,0.95,A,0.98,,,B
OpenThinker2-7B,numbertheory_primes_m1,number theory,primes,B,0.0,0.95,A,0.95,A,0.95,,,B
OpenThinker2-7B,numbertheory_primes_m2,number theory,primes,A,1.0,0.95,A,0.9,A,0.95,,,B
OpenThinker2-7B,numbertheory_primes_m3,number theory,primes,B,0.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,numbertheory_primes_h1,number theory,primes,A,1.0,0.99,A,0.9,A,0.95,,,A
OpenThinker2-7B,numbertheory_primes_h2,number theory,primes,B,0.0,1.0,A,0.85,A,0.95,B,0.95,B
OpenThinker2-7B,numbertheory_primes_h3,number theory,primes,A,1.0,1.0,A,0.85,B,0.95,A,0.95,B
OpenThinker2-7B,numbertheory_diophantine_e1,number theory,diophantine equations,A,1.0,0.5,A,0.85,A,0.95,A,0.95,B
OpenThinker2-7B,numbertheory_diophantine_e2,number theory,diophantine equations,B,0.0,0.95,A,0.9,B,0.95,A,0.95,B
OpenThinker2-7B,numbertheory_diophantine_e3,number theory,diophantine equations,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,numbertheory_diophantine_m1,number theory,diophantine equations,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
OpenThinker2-7B,numbertheory_diophantine_m2,number theory,diophantine equations,Tie,0.5,0.5,B,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,numbertheory_diophantine_m3,number theory,diophantine equations,A,1.0,1.0,A,0.85,A,0.95,A,0.95,B
OpenThinker2-7B,numbertheory_diophantine_h1,number theory,diophantine equations,A,1.0,1.0,A,0.95,B,0.95,A,0.95,B
OpenThinker2-7B,numbertheory_diophantine_h2,number theory,diophantine equations,A,1.0,0.98,A,0.9,B,0.95,A,0.95,A
OpenThinker2-7B,numbertheory_diophantine_h3,number theory,diophantine equations,B,1.0,1.0,B,0.85,B,0.95,,,A
OpenThinker2-7B,numbertheory_sequences_e1,number theory,number sequences,A,1.0,0.5,A,0.85,A,0.95,A,1.0,A
OpenThinker2-7B,numbertheory_sequences_e2,number theory,number sequences,A,1.0,1.0,A,0.85,A,0.95,,,A
OpenThinker2-7B,numbertheory_sequences_e3,number theory,number sequences,B,0.0,0.99,A,0.85,B,0.98,A,0.95,A
OpenThinker2-7B,numbertheory_sequences_m1,number theory,number sequences,B,0.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,numbertheory_sequences_m2,number theory,number sequences,A,1.0,1.0,A,0.85,A,0.95,,,B
OpenThinker2-7B,numbertheory_sequences_m3,number theory,number sequences,A,1.0,1.0,A,0.95,A,0.95,A,1.0,B
OpenThinker2-7B,numbertheory_sequences_h1,number theory,number sequences,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,numbertheory_sequences_h2,number theory,number sequences,A,1.0,1.0,A,0.9,B,0.98,A,0.95,A
OpenThinker2-7B,numbertheory_sequences_h3,number theory,number sequences,B,0.0,0.98,A,0.85,B,0.95,A,0.95,A
OpenThinker2-7B,combinatorics_counting_e1,combinatorics,counting principles,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,combinatorics_counting_e2,combinatorics,counting principles,A,1.0,0.95,A,0.85,A,0.95,A,1.0,A
OpenThinker2-7B,combinatorics_counting_e3,combinatorics,counting principles,B,1.0,0.98,B,0.95,B,0.98,B,0.95,B
OpenThinker2-7B,combinatorics_counting_m1,combinatorics,counting principles,A,1.0,1.0,A,0.95,A,0.95,B,0.95,A
OpenThinker2-7B,combinatorics_counting_m2,combinatorics,counting principles,Tie,0.5,0.5,B,0.95,B,0.98,A,0.95,B
OpenThinker2-7B,combinatorics_counting_m3,combinatorics,counting principles,B,0.0,0.99,B,0.85,A,0.95,A,1.0,A
OpenThinker2-7B,combinatorics_counting_h1,combinatorics,counting principles,A,1.0,0.95,A,0.95,A,0.98,A,0.95,B
OpenThinker2-7B,combinatorics_counting_h2,combinatorics,counting principles,A,1.0,1.0,B,0.85,A,0.98,A,0.95,A
OpenThinker2-7B,combinatorics_counting_h3,combinatorics,counting principles,A,0.0,1.0,B,0.9,B,0.98,A,0.95,A
OpenThinker2-7B,combinatorics_permutations_e1,combinatorics,permutations,B,0.0,0.98,A,0.95,A,0.98,A,0.95,B
OpenThinker2-7B,combinatorics_permutations_e2,combinatorics,permutations,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,combinatorics_permutations_e3,combinatorics,permutations,A,1.0,1.0,B,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,combinatorics_permutations_m1,combinatorics,permutations,A,1.0,0.98,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,combinatorics_permutations_m2,combinatorics,permutations,B,0.0,0.95,A,0.92,A,0.95,,,B
OpenThinker2-7B,combinatorics_permutations_m3,combinatorics,permutations,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,combinatorics_permutations_h1,combinatorics,permutations,B,1.0,1.0,A,0.85,B,0.98,,,A
OpenThinker2-7B,combinatorics_permutations_h2,combinatorics,permutations,A,1.0,0.95,A,1.0,A,0.95,A,1.0,A
OpenThinker2-7B,combinatorics_permutations_h3,combinatorics,permutations,Tie,0.5,0.5,A,0.7,A,0.6,A,0.7,B
OpenThinker2-7B,combinatorics_combinations_e1,combinatorics,combinations,B,0.0,1.0,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,combinatorics_combinations_e2,combinatorics,combinations,A,1.0,0.98,A,0.85,A,0.95,A,0.95,B
OpenThinker2-7B,combinatorics_combinations_e3,combinatorics,combinations,A,1.0,1.0,A,0.85,A,0.95,B,0.95,B
OpenThinker2-7B,combinatorics_combinations_m1,combinatorics,combinations,A,1.0,0.9,A,0.85,A,0.98,A,1.0,B
OpenThinker2-7B,combinatorics_combinations_m2,combinatorics,combinations,A,1.0,1.0,A,0.95,A,0.95,A,1.0,B
OpenThinker2-7B,combinatorics_combinations_m3,combinatorics,combinations,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,combinatorics_combinations_h1,combinatorics,combinations,B,0.0,1.0,A,0.85,A,0.98,A,0.95,B
OpenThinker2-7B,combinatorics_combinations_h2,combinatorics,combinations,B,0.0,1.0,A,0.9,A,0.98,A,1.0,B
OpenThinker2-7B,combinatorics_combinations_h3,combinatorics,combinations,B,0.0,1.0,A,0.95,A,0.98,,,B
OpenThinker2-7B,combinatorics_probability_e1,combinatorics,probability,A,1.0,0.98,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,combinatorics_probability_e2,combinatorics,probability,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,combinatorics_probability_e3,combinatorics,probability,A,1.0,1.0,A,0.95,B,0.95,A,1.0,B
OpenThinker2-7B,combinatorics_probability_m1,combinatorics,probability,A,1.0,1.0,A,0.55,A,0.98,A,0.95,B
OpenThinker2-7B,combinatorics_probability_m2,combinatorics,probability,A,1.0,1.0,A,0.95,A,0.98,A,0.95,B
OpenThinker2-7B,combinatorics_probability_m3,combinatorics,probability,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,combinatorics_probability_h1,combinatorics,probability,A,1.0,1.0,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,combinatorics_probability_h2,combinatorics,probability,B,0.0,0.98,A,0.9,B,0.95,A,0.95,A
OpenThinker2-7B,combinatorics_probability_h3,combinatorics,probability,A,0.0,0.95,B,0.9,B,0.95,B,0.9,B
OpenThinker2-7B,combinatorics_recursion_e1,combinatorics,recursion,A,0.0,0.95,A,0.85,B,0.95,,,A
OpenThinker2-7B,combinatorics_recursion_e2,combinatorics,recursion,A,1.0,1.0,A,0.85,A,0.95,,,A
OpenThinker2-7B,combinatorics_recursion_e3,combinatorics,recursion,A,1.0,1.0,A,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,combinatorics_recursion_m1,combinatorics,recursion,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,combinatorics_recursion_m2,combinatorics,recursion,A,0.0,1.0,B,0.95,B,0.95,A,0.95,A
OpenThinker2-7B,combinatorics_recursion_m3,combinatorics,recursion,A,1.0,1.0,A,0.85,A,0.95,A,1.0,A
OpenThinker2-7B,combinatorics_recursion_h1,combinatorics,recursion,A,1.0,0.98,A,0.95,B,0.95,A,0.95,A
OpenThinker2-7B,combinatorics_recursion_h2,combinatorics,recursion,A,1.0,0.99,B,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,combinatorics_recursion_h3,combinatorics,recursion,A,1.0,1.0,A,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,statistics_descriptive_e1,statistics,descriptive statistics,A,0.0,0.98,B,0.95,B,0.95,,,B
OpenThinker2-7B,statistics_descriptive_e2,statistics,descriptive statistics,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,statistics_descriptive_e3,statistics,descriptive statistics,B,0.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,statistics_descriptive_m1,statistics,descriptive statistics,A,1.0,1.0,A,0.95,A,0.98,A,0.9,A
OpenThinker2-7B,statistics_descriptive_m2,statistics,descriptive statistics,A,0.0,0.99,B,0.9,B,0.98,A,0.95,A
OpenThinker2-7B,statistics_descriptive_m3,statistics,descriptive statistics,Tie,0.5,0.5,B,0.9,B,0.85,A,0.95,B
OpenThinker2-7B,statistics_descriptive_h1,statistics,descriptive statistics,B,0.0,0.5,B,0.85,A,0.95,A,0.8,B
OpenThinker2-7B,statistics_descriptive_h2,statistics,descriptive statistics,A,1.0,1.0,B,0.95,A,0.85,A,0.95,A
OpenThinker2-7B,statistics_descriptive_h3,statistics,descriptive statistics,Tie,0.5,0.5,A,0.95,A,0.95,B,0.95,A
OpenThinker2-7B,statistics_distributions_e1,statistics,distributions,A,1.0,0.95,A,0.95,B,0.95,,,B
OpenThinker2-7B,statistics_distributions_e2,statistics,distributions,A,1.0,1.0,A,0.85,A,0.95,A,0.95,B
OpenThinker2-7B,statistics_distributions_e3,statistics,distributions,A,1.0,0.99,A,0.9,A,0.95,A,0.95,B
OpenThinker2-7B,statistics_distributions_m1,statistics,distributions,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,statistics_distributions_m2,statistics,distributions,A,1.0,1.0,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,statistics_distributions_m3,statistics,distributions,B,1.0,1.0,B,0.98,B,0.95,B,0.95,B
OpenThinker2-7B,statistics_distributions_h1,statistics,distributions,A,0.0,1.0,A,0.85,B,0.95,,,B
OpenThinker2-7B,statistics_distributions_h2,statistics,distributions,A,1.0,0.95,B,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,statistics_distributions_h3,statistics,distributions,B,1.0,0.95,A,0.85,B,0.95,,,B
OpenThinker2-7B,statistics_hypothesis_e1,statistics,hypothesis testing,B,1.0,0.98,B,0.85,B,0.95,A,0.9,A
OpenThinker2-7B,statistics_hypothesis_e2,statistics,hypothesis testing,B,0.0,0.95,A,0.85,A,0.95,,,B
OpenThinker2-7B,statistics_hypothesis_e3,statistics,hypothesis testing,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,statistics_hypothesis_m1,statistics,hypothesis testing,A,1.0,0.98,A,0.9,B,0.95,A,0.95,A
OpenThinker2-7B,statistics_hypothesis_m2,statistics,hypothesis testing,A,1.0,0.95,B,1.0,A,0.95,A,0.95,A
OpenThinker2-7B,statistics_hypothesis_m3,statistics,hypothesis testing,A,0.0,1.0,B,0.75,B,0.92,B,0.9,B
OpenThinker2-7B,statistics_hypothesis_h1,statistics,hypothesis testing,A,0.0,0.95,B,0.95,B,0.95,A,0.95,A
OpenThinker2-7B,statistics_hypothesis_h2,statistics,hypothesis testing,A,0.0,1.0,B,0.95,B,0.95,B,0.95,B
OpenThinker2-7B,statistics_hypothesis_h3,statistics,hypothesis testing,A,1.0,1.0,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,statistics_regression_e1,statistics,regression,B,0.0,1.0,A,0.9,A,0.95,A,0.95,A
OpenThinker2-7B,statistics_regression_e2,statistics,regression,B,1.0,1.0,B,0.95,B,0.98,B,0.95,A
OpenThinker2-7B,statistics_regression_e3,statistics,regression,A,1.0,0.95,A,0.85,A,0.95,A,0.9,B
OpenThinker2-7B,statistics_regression_m1,statistics,regression,A,1.0,0.98,A,0.85,A,0.95,A,0.95,B
OpenThinker2-7B,statistics_regression_m2,statistics,regression,B,0.0,0.95,A,0.95,A,0.98,B,0.9,B
OpenThinker2-7B,statistics_regression_m3,statistics,regression,A,1.0,0.9,A,0.85,A,0.98,A,1.0,B
OpenThinker2-7B,statistics_regression_h1,statistics,regression,B,0.0,0.99,A,0.9,A,0.95,A,0.95,B
OpenThinker2-7B,statistics_regression_h2,statistics,regression,A,1.0,0.95,A,0.95,A,0.95,,,B
OpenThinker2-7B,statistics_regression_h3,statistics,regression,B,0.0,0.99,A,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,statistics_bayesian_e1,statistics,bayesian inference,A,0.0,0.95,B,0.85,B,0.95,,,B
OpenThinker2-7B,statistics_bayesian_e2,statistics,bayesian inference,B,0.0,0.95,B,0.92,A,0.95,A,0.95,A
OpenThinker2-7B,statistics_bayesian_e3,statistics,bayesian inference,A,1.0,0.95,A,0.85,B,0.98,A,0.95,A
OpenThinker2-7B,statistics_bayesian_m1,statistics,bayesian inference,A,1.0,1.0,A,0.95,A,0.95,,,B
OpenThinker2-7B,statistics_bayesian_m2,statistics,bayesian inference,A,1.0,1.0,A,0.9,A,0.98,,,B
OpenThinker2-7B,statistics_bayesian_m3,statistics,bayesian inference,B,1.0,1.0,B,0.92,B,0.98,A,0.9,A
OpenThinker2-7B,statistics_bayesian_h1,statistics,bayesian inference,Tie,0.5,0.5,B,0.95,B,0.95,B,0.95,B
OpenThinker2-7B,statistics_bayesian_h2,statistics,bayesian inference,A,0.0,0.9,B,0.6,A,0.85,B,0.85,A
OpenThinker2-7B,statistics_bayesian_h3,statistics,bayesian inference,A,1.0,0.95,A,0.98,A,0.95,A,0.95,B
OpenThinker2-7B,linearalgebra_matrices_e1,linear algebra,matrices,B,1.0,0.5,B,0.95,B,0.98,,,A
OpenThinker2-7B,linearalgebra_matrices_e2,linear algebra,matrices,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,linearalgebra_matrices_e3,linear algebra,matrices,A,1.0,1.0,B,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,linearalgebra_matrices_m1,linear algebra,matrices,A,1.0,1.0,A,1.0,A,0.95,A,0.95,A
OpenThinker2-7B,linearalgebra_matrices_m2,linear algebra,matrices,Tie,0.5,0.5,A,0.85,A,0.95,A,1.0,B
OpenThinker2-7B,linearalgebra_matrices_m3,linear algebra,matrices,A,1.0,0.95,A,1.0,A,0.98,,,A
OpenThinker2-7B,linearalgebra_matrices_h1,linear algebra,matrices,A,1.0,1.0,B,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,linearalgebra_matrices_h2,linear algebra,matrices,A,1.0,0.99,A,0.95,B,0.95,,,B
OpenThinker2-7B,linearalgebra_matrices_h3,linear algebra,matrices,A,1.0,1.0,A,0.9,A,0.95,A,0.95,A
OpenThinker2-7B,linearalgebra_determinants_e1,linear algebra,determinants,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,linearalgebra_determinants_e2,linear algebra,determinants,B,0.0,1.0,B,0.85,A,0.98,A,1.0,B
OpenThinker2-7B,linearalgebra_determinants_e3,linear algebra,determinants,A,1.0,0.98,A,0.9,A,0.98,A,1.0,B
OpenThinker2-7B,linearalgebra_determinants_m1,linear algebra,determinants,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,linearalgebra_determinants_m2,linear algebra,determinants,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
OpenThinker2-7B,linearalgebra_determinants_m3,linear algebra,determinants,B,0.0,0.95,A,0.85,A,0.98,B,1.0,B
OpenThinker2-7B,linearalgebra_determinants_h1,linear algebra,determinants,A,0.0,0.98,B,0.95,B,0.95,B,0.95,A
OpenThinker2-7B,linearalgebra_determinants_h2,linear algebra,determinants,B,0.0,0.95,A,0.95,B,0.95,A,0.95,B
OpenThinker2-7B,linearalgebra_determinants_h3,linear algebra,determinants,A,1.0,0.95,A,0.95,B,0.95,A,1.0,B
OpenThinker2-7B,linearalgebra_vectorspaces_e1,linear algebra,vector spaces,A,1.0,0.98,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,linearalgebra_vectorspaces_e2,linear algebra,vector spaces,B,0.0,0.95,A,0.95,A,0.95,A,1.0,B
OpenThinker2-7B,linearalgebra_vectorspaces_e3,linear algebra,vector spaces,B,0.0,0.95,B,0.75,A,0.95,A,0.95,B
OpenThinker2-7B,linearalgebra_vectorspaces_m1,linear algebra,vector spaces,A,0.0,1.0,A,0.85,B,0.95,B,0.95,B
OpenThinker2-7B,linearalgebra_vectorspaces_m2,linear algebra,vector spaces,B,1.0,1.0,B,0.9,B,0.95,A,0.95,A
OpenThinker2-7B,linearalgebra_vectorspaces_m3,linear algebra,vector spaces,A,1.0,0.95,A,0.95,A,0.85,A,0.95,A
OpenThinker2-7B,linearalgebra_vectorspaces_h1,linear algebra,vector spaces,Tie,0.5,0.5,B,0.85,B,0.95,,,B
OpenThinker2-7B,linearalgebra_vectorspaces_h2,linear algebra,vector spaces,A,1.0,0.98,A,0.85,A,0.95,B,0.9,B
OpenThinker2-7B,linearalgebra_vectorspaces_h3,linear algebra,vector spaces,A,0.0,0.95,B,0.95,B,0.9,B,0.9,A
OpenThinker2-7B,linearalgebra_eigenvalues_e1,linear algebra,eigenvalues,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
OpenThinker2-7B,linearalgebra_eigenvalues_e2,linear algebra,eigenvalues,A,1.0,0.95,A,0.95,A,0.95,B,0.95,B
OpenThinker2-7B,linearalgebra_eigenvalues_e3,linear algebra,eigenvalues,A,1.0,1.0,B,0.95,A,0.95,A,0.98,A
OpenThinker2-7B,linearalgebra_eigenvalues_m1,linear algebra,eigenvalues,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
OpenThinker2-7B,linearalgebra_eigenvalues_m2,linear algebra,eigenvalues,A,1.0,0.5,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,linearalgebra_eigenvalues_m3,linear algebra,eigenvalues,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,linearalgebra_eigenvalues_h1,linear algebra,eigenvalues,B,0.0,0.5,A,1.0,A,0.95,A,0.95,B
OpenThinker2-7B,linearalgebra_eigenvalues_h2,linear algebra,eigenvalues,A,1.0,1.0,A,0.95,A,0.95,A,0.95,B
OpenThinker2-7B,linearalgebra_eigenvalues_h3,linear algebra,eigenvalues,A,0.0,1.0,B,0.95,B,0.95,B,0.95,A
OpenThinker2-7B,linearalgebra_transformations_e1,linear algebra,linear transformations,B,0.0,1.0,A,0.9,A,0.95,A,0.95,A
OpenThinker2-7B,linearalgebra_transformations_e2,linear algebra,linear transformations,A,1.0,1.0,A,0.9,A,0.95,A,0.95,B
OpenThinker2-7B,linearalgebra_transformations_e3,linear algebra,linear transformations,A,0.0,0.95,B,0.95,B,0.98,B,0.9,A
OpenThinker2-7B,linearalgebra_transformations_m1,linear algebra,linear transformations,A,1.0,1.0,A,0.95,B,0.95,A,0.95,B
OpenThinker2-7B,linearalgebra_transformations_m2,linear algebra,linear transformations,A,1.0,1.0,B,0.85,A,0.95,,,A
OpenThinker2-7B,linearalgebra_transformations_m3,linear algebra,linear transformations,A,0.0,1.0,B,0.95,A,0.95,B,0.95,A
OpenThinker2-7B,linearalgebra_transformations_h1,linear algebra,linear transformations,B,0.0,1.0,A,0.98,A,0.95,A,0.95,A
OpenThinker2-7B,linearalgebra_transformations_h2,linear algebra,linear transformations,A,1.0,1.0,B,0.85,A,0.95,A,0.95,B
OpenThinker2-7B,linearalgebra_transformations_h3,linear algebra,linear transformations,Tie,0.5,0.5,B,0.9,B,0.95,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_basic_operations_e1,arithmetic,basic operations,B,0.0,0.95,A,0.6,B,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_basic_operations_e2,arithmetic,basic operations,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_basic_operations_e3,arithmetic,basic operations,A,1.0,0.85,A,0.98,A,0.98,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_basic_operations_m1,arithmetic,basic operations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_basic_operations_m2,arithmetic,basic operations,A,1.0,0.95,A,1.0,A,0.85,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_basic_operations_m3,arithmetic,basic operations,B,0.0,0.95,A,0.85,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_basic_operations_h1,arithmetic,basic operations,A,0.0,0.95,B,0.95,B,0.92,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_basic_operations_h2,arithmetic,basic operations,B,1.0,0.95,A,0.9,B,0.95,B,1.0,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_basic_operations_h3,arithmetic,basic operations,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_fractions_e1,arithmetic,fractions,A,1.0,0.95,A,0.9,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_fractions_e2,arithmetic,fractions,A,1.0,0.9,A,0.95,A,0.9,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_fractions_e3,arithmetic,fractions,B,0.0,0.85,A,0.95,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_fractions_m1,arithmetic,fractions,A,1.0,0.95,B,0.95,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_fractions_m2,arithmetic,fractions,A,1.0,1.0,A,0.85,A,0.95,B,0.9,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_fractions_m3,arithmetic,fractions,A,0.0,0.95,B,0.9,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_fractions_h1,arithmetic,fractions,A,1.0,0.95,A,1.0,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_fractions_h2,arithmetic,fractions,A,0.0,0.95,B,0.85,B,0.98,B,1.0,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_fractions_h3,arithmetic,fractions,A,1.0,0.95,A,1.0,A,0.98,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_percentages_e1,arithmetic,percentages,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_percentages_e2,arithmetic,percentages,B,0.0,0.95,A,0.85,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_percentages_e3,arithmetic,percentages,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_percentages_m1,arithmetic,percentages,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_percentages_m2,arithmetic,percentages,A,1.0,0.95,A,0.85,B,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_percentages_m3,arithmetic,percentages,B,0.0,0.85,A,0.85,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_percentages_h1,arithmetic,percentages,A,0.0,0.95,B,0.95,B,0.98,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_percentages_h2,arithmetic,percentages,B,0.0,0.95,A,0.95,A,0.9,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_percentages_h3,arithmetic,percentages,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_numerical_e1,arithmetic,numerical approximation,A,1.0,0.95,A,0.9,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_numerical_e2,arithmetic,numerical approximation,A,0.0,0.9,B,0.85,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_numerical_e3,arithmetic,numerical approximation,B,0.0,0.95,A,0.95,B,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_numerical_m1,arithmetic,numerical approximation,B,0.0,0.95,A,0.95,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_numerical_m2,arithmetic,numerical approximation,A,1.0,0.9,A,0.95,A,0.9,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_numerical_m3,arithmetic,numerical approximation,B,1.0,0.85,B,0.85,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_numerical_h1,arithmetic,numerical approximation,B,0.0,0.9,B,0.85,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_numerical_h2,arithmetic,numerical approximation,A,0.0,0.95,B,0.85,B,0.9,A,0.75,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_numerical_h3,arithmetic,numerical approximation,A,1.0,0.95,A,0.95,A,0.98,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_order_e1,arithmetic,order of operations,B,0.0,0.95,A,0.85,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_order_e2,arithmetic,order of operations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_order_e3,arithmetic,order of operations,A,1.0,0.95,A,0.95,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_order_m1,arithmetic,order of operations,B,0.0,0.95,A,0.9,B,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_order_m2,arithmetic,order of operations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_order_m3,arithmetic,order of operations,B,0.0,0.95,A,0.95,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_order_h1,arithmetic,order of operations,A,1.0,0.85,A,0.95,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,arithmetic_order_h2,arithmetic,order of operations,B,1.0,1.0,A,0.95,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,arithmetic_order_h3,arithmetic,order of operations,A,0.0,1.0,B,0.95,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,algebra_equations_e1,algebra,equations,A,1.0,0.95,A,0.95,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,algebra_equations_e2,algebra,equations,A,1.0,0.95,A,0.95,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,algebra_equations_e3,algebra,equations,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,algebra_equations_m1,algebra,equations,A,1.0,0.95,A,0.6,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,algebra_equations_m2,algebra,equations,A,1.0,0.85,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,algebra_equations_m3,algebra,equations,A,0.0,0.95,A,0.95,B,0.98,B,1.0,A
DeepSeek-R1-Distill-Qwen-7B,algebra_equations_h1,algebra,equations,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,algebra_equations_h2,algebra,equations,A,0.0,0.95,B,0.85,B,0.95,,,B
DeepSeek-R1-Distill-Qwen-7B,algebra_equations_h3,algebra,equations,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,algebra_inequalities_e1,algebra,inequalities,A,1.0,0.95,A,0.95,A,0.95,B,0.9,A
DeepSeek-R1-Distill-Qwen-7B,algebra_inequalities_e2,algebra,inequalities,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,algebra_inequalities_e3,algebra,inequalities,B,0.0,0.95,A,0.85,A,0.95,B,0.9,B
DeepSeek-R1-Distill-Qwen-7B,algebra_inequalities_m1,algebra,inequalities,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,algebra_inequalities_m2,algebra,inequalities,A,1.0,0.95,A,0.85,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,algebra_inequalities_m3,algebra,inequalities,A,1.0,1.0,A,0.95,A,0.92,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,algebra_inequalities_h1,algebra,inequalities,A,1.0,0.95,A,0.95,B,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,algebra_inequalities_h2,algebra,inequalities,A,1.0,0.95,A,0.95,A,0.95,,,A
DeepSeek-R1-Distill-Qwen-7B,algebra_inequalities_h3,algebra,inequalities,B,0.0,0.95,A,0.95,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,algebra_polynomials_e1,algebra,polynomials,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,algebra_polynomials_e2,algebra,polynomials,Tie,0.5,0.5,A,0.9,A,0.95,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,algebra_polynomials_e3,algebra,polynomials,A,1.0,0.95,A,0.85,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,algebra_polynomials_m1,algebra,polynomials,A,1.0,0.95,A,0.95,A,0.98,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,algebra_polynomials_m2,algebra,polynomials,A,1.0,0.95,A,0.95,A,0.95,A,0.9,A
DeepSeek-R1-Distill-Qwen-7B,algebra_polynomials_m3,algebra,polynomials,A,0.0,0.95,B,0.95,B,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,algebra_polynomials_h1,algebra,polynomials,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,algebra_polynomials_h2,algebra,polynomials,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,algebra_polynomials_h3,algebra,polynomials,B,1.0,0.55,B,0.85,B,0.85,A,0.8,A
DeepSeek-R1-Distill-Qwen-7B,algebra_functions_e1,algebra,functions,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,algebra_functions_e2,algebra,functions,A,1.0,0.85,A,0.95,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,algebra_functions_e3,algebra,functions,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,algebra_functions_m1,algebra,functions,A,0.0,0.95,B,0.55,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,algebra_functions_m2,algebra,functions,B,0.0,0.95,A,0.95,A,0.95,B,1.0,A
DeepSeek-R1-Distill-Qwen-7B,algebra_functions_m3,algebra,functions,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,algebra_functions_h1,algebra,functions,B,0.0,0.95,A,0.95,B,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,algebra_functions_h2,algebra,functions,B,0.0,0.95,B,0.85,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,algebra_functions_h3,algebra,functions,B,1.0,0.95,B,0.85,A,0.95,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,algebra_systems_e1,algebra,systems of equations,A,1.0,0.95,A,0.95,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,algebra_systems_e2,algebra,systems of equations,A,0.0,0.85,B,1.0,B,0.9,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,algebra_systems_e3,algebra,systems of equations,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,algebra_systems_m1,algebra,systems of equations,A,1.0,1.0,A,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,algebra_systems_m2,algebra,systems of equations,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,algebra_systems_m3,algebra,systems of equations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,algebra_systems_h1,algebra,systems of equations,Tie,0.5,0.5,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,algebra_systems_h2,algebra,systems of equations,B,0.0,0.95,A,1.0,A,0.98,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,algebra_systems_h3,algebra,systems of equations,A,1.0,1.0,B,0.92,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,calculus_differentiation_e1,calculus,differentiation,A,0.0,0.95,B,0.85,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,calculus_differentiation_e2,calculus,differentiation,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,calculus_differentiation_e3,calculus,differentiation,A,1.0,0.85,A,0.85,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,calculus_differentiation_m1,calculus,differentiation,A,0.0,0.95,B,0.95,B,0.98,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,calculus_differentiation_m2,calculus,differentiation,A,0.0,0.85,B,0.9,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,calculus_differentiation_m3,calculus,differentiation,B,0.0,0.95,A,0.85,A,0.95,,,A
DeepSeek-R1-Distill-Qwen-7B,calculus_differentiation_h1,calculus,differentiation,A,0.0,0.95,A,0.95,B,0.98,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,calculus_differentiation_h2,calculus,differentiation,A,1.0,0.95,B,0.85,A,0.95,,,A
DeepSeek-R1-Distill-Qwen-7B,calculus_differentiation_h3,calculus,differentiation,A,0.0,0.95,A,0.9,B,0.98,,,A
DeepSeek-R1-Distill-Qwen-7B,calculus_integration_e1,calculus,integration,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,calculus_integration_e2,calculus,integration,A,0.0,1.0,B,0.85,B,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,calculus_integration_e3,calculus,integration,A,1.0,0.95,B,0.95,A,0.98,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,calculus_integration_m1,calculus,integration,A,1.0,0.85,A,0.95,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,calculus_integration_m2,calculus,integration,B,0.0,0.95,A,0.95,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,calculus_integration_m3,calculus,integration,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,calculus_integration_h1,calculus,integration,B,1.0,0.95,B,0.85,B,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,calculus_integration_h2,calculus,integration,A,0.0,0.95,B,0.95,B,0.98,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,calculus_integration_h3,calculus,integration,A,1.0,0.95,B,0.6,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,calculus_limits_e1,calculus,limits,A,0.0,0.95,B,0.95,B,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,calculus_limits_e2,calculus,limits,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,calculus_limits_e3,calculus,limits,A,0.0,0.85,B,0.95,B,0.95,B,1.0,A
DeepSeek-R1-Distill-Qwen-7B,calculus_limits_m1,calculus,limits,A,1.0,0.95,A,0.95,B,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,calculus_limits_m2,calculus,limits,A,0.0,0.85,A,0.85,B,0.95,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,calculus_limits_m3,calculus,limits,B,1.0,0.95,A,0.9,B,0.98,B,0.9,A
DeepSeek-R1-Distill-Qwen-7B,calculus_limits_h1,calculus,limits,A,1.0,0.95,A,0.95,A,0.95,,,B
DeepSeek-R1-Distill-Qwen-7B,calculus_limits_h2,calculus,limits,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,calculus_limits_h3,calculus,limits,A,1.0,0.95,B,0.92,A,0.95,,,A
DeepSeek-R1-Distill-Qwen-7B,calculus_series_e1,calculus,series,B,1.0,0.95,B,0.98,B,0.95,B,1.0,B
DeepSeek-R1-Distill-Qwen-7B,calculus_series_e2,calculus,series,A,1.0,0.95,A,1.0,A,1.0,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,calculus_series_e3,calculus,series,A,1.0,0.95,A,0.95,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,calculus_series_m1,calculus,series,A,0.0,0.95,A,0.95,B,0.92,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,calculus_series_m2,calculus,series,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,calculus_series_m3,calculus,series,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,calculus_series_h1,calculus,series,B,1.0,0.95,B,0.9,B,0.95,,,A
DeepSeek-R1-Distill-Qwen-7B,calculus_series_h2,calculus,series,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,calculus_series_h3,calculus,series,A,1.0,0.85,A,0.95,A,0.95,,,B
DeepSeek-R1-Distill-Qwen-7B,calculus_applications_e1,calculus,applications,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,calculus_applications_e2,calculus,applications,A,1.0,0.85,A,0.95,B,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,calculus_applications_e3,calculus,applications,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,calculus_applications_m1,calculus,applications,A,0.0,0.9,B,0.85,B,0.95,A,0.9,B
DeepSeek-R1-Distill-Qwen-7B,calculus_applications_m2,calculus,applications,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,calculus_applications_m3,calculus,applications,A,1.0,0.95,A,0.95,A,0.98,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,calculus_applications_h1,calculus,applications,A,0.0,1.0,B,0.9,B,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,calculus_applications_h2,calculus,applications,A,1.0,0.95,A,0.85,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,calculus_applications_h3,calculus,applications,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,geometry_plane_e1,geometry,plane geometry,A,0.0,0.85,B,0.95,B,0.95,B,1.0,B
DeepSeek-R1-Distill-Qwen-7B,geometry_plane_e2,geometry,plane geometry,A,0.0,0.85,B,0.95,B,0.95,B,1.0,B
DeepSeek-R1-Distill-Qwen-7B,geometry_plane_e3,geometry,plane geometry,A,1.0,0.95,B,0.85,A,0.95,A,0.9,A
DeepSeek-R1-Distill-Qwen-7B,geometry_plane_m1,geometry,plane geometry,A,0.0,1.0,B,0.85,B,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,geometry_plane_m2,geometry,plane geometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,geometry_plane_m3,geometry,plane geometry,B,0.0,0.95,A,0.85,A,0.98,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,geometry_plane_h1,geometry,plane geometry,A,0.0,0.95,B,0.9,B,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,geometry_plane_h2,geometry,plane geometry,A only,0.0,0.5,A,0.85,B,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,geometry_plane_h3,geometry,plane geometry,A,1.0,0.95,A,1.0,A,0.98,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,geometry_coordinate_e1,geometry,coordinate geometry,A,1.0,0.95,A,0.95,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,geometry_coordinate_e2,geometry,coordinate geometry,A,1.0,0.95,A,0.9,B,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,geometry_coordinate_e3,geometry,coordinate geometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,geometry_coordinate_m1,geometry,coordinate geometry,A,1.0,0.95,A,0.6,A,0.95,A,0.9,B
DeepSeek-R1-Distill-Qwen-7B,geometry_coordinate_m2,geometry,coordinate geometry,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,geometry_coordinate_m3,geometry,coordinate geometry,B,0.0,0.95,A,0.85,B,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,geometry_coordinate_h1,geometry,coordinate geometry,B,1.0,0.95,B,0.9,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,geometry_coordinate_h2,geometry,coordinate geometry,B,1.0,0.95,B,0.95,B,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,geometry_coordinate_h3,geometry,coordinate geometry,A,1.0,0.9,B,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,geometry_transformations_e1,geometry,transformations,B,1.0,0.85,B,0.9,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,geometry_transformations_e2,geometry,transformations,B,1.0,0.85,B,0.95,A,0.95,B,1.0,A
DeepSeek-R1-Distill-Qwen-7B,geometry_transformations_e3,geometry,transformations,A,1.0,0.95,A,0.9,A,0.98,,,B
DeepSeek-R1-Distill-Qwen-7B,geometry_transformations_m1,geometry,transformations,A,1.0,0.85,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,geometry_transformations_m2,geometry,transformations,B,1.0,0.95,B,0.9,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,geometry_transformations_m3,geometry,transformations,B,1.0,0.85,B,0.95,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,geometry_transformations_h1,geometry,transformations,A,1.0,1.0,A,1.0,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,geometry_transformations_h2,geometry,transformations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,geometry_transformations_h3,geometry,transformations,A,1.0,0.95,A,0.95,A,0.75,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,geometry_mensuration_e1,geometry,mensuration,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,geometry_mensuration_e2,geometry,mensuration,A,1.0,0.85,A,0.95,B,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,geometry_mensuration_e3,geometry,mensuration,A,1.0,0.95,B,0.85,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,geometry_mensuration_m1,geometry,mensuration,A,1.0,1.0,A,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,geometry_mensuration_m2,geometry,mensuration,B,1.0,0.95,B,0.95,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,geometry_mensuration_m3,geometry,mensuration,A,1.0,1.0,A,0.55,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,geometry_mensuration_h1,geometry,mensuration,A,0.0,0.85,B,0.92,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,geometry_mensuration_h2,geometry,mensuration,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,geometry_mensuration_h3,geometry,mensuration,A,0.0,0.85,B,0.85,B,0.85,A,0.9,B
DeepSeek-R1-Distill-Qwen-7B,geometry_trigonometry_e1,geometry,trigonometry,A,0.0,0.95,B,0.9,B,0.95,B,1.0,B
DeepSeek-R1-Distill-Qwen-7B,geometry_trigonometry_e2,geometry,trigonometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,geometry_trigonometry_e3,geometry,trigonometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,geometry_trigonometry_m1,geometry,trigonometry,A,1.0,0.95,A,0.95,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,geometry_trigonometry_m2,geometry,trigonometry,A,0.0,0.95,B,0.85,A,0.95,B,1.0,A
DeepSeek-R1-Distill-Qwen-7B,geometry_trigonometry_m3,geometry,trigonometry,A,1.0,0.95,A,0.95,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,geometry_trigonometry_h1,geometry,trigonometry,Tie,0.5,0.5,A,0.85,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,geometry_trigonometry_h2,geometry,trigonometry,B,1.0,0.95,B,0.85,B,0.85,A,0.9,B
DeepSeek-R1-Distill-Qwen-7B,geometry_trigonometry_h3,geometry,trigonometry,A,0.0,0.95,B,0.85,B,0.95,A,0.85,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_divisibility_e1,number theory,divisibility,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_divisibility_e2,number theory,divisibility,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_divisibility_e3,number theory,divisibility,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_divisibility_m1,number theory,divisibility,A,0.0,0.95,B,0.85,B,0.92,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_divisibility_m2,number theory,divisibility,A,1.0,0.95,A,0.85,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_divisibility_m3,number theory,divisibility,A,1.0,0.85,A,0.85,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_divisibility_h1,number theory,divisibility,A,0.0,0.95,B,0.85,B,0.95,,,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_divisibility_h2,number theory,divisibility,A,1.0,0.95,A,0.85,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_divisibility_h3,number theory,divisibility,A,1.0,0.95,A,0.85,A,0.98,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_modular_e1,number theory,modular arithmetic,A,1.0,0.85,A,0.95,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_modular_e2,number theory,modular arithmetic,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_modular_e3,number theory,modular arithmetic,A,1.0,0.95,A,0.9,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_modular_m1,number theory,modular arithmetic,Tie,0.5,0.5,B,0.85,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_modular_m2,number theory,modular arithmetic,B,0.0,0.95,A,0.95,A,0.95,,,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_modular_m3,number theory,modular arithmetic,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_modular_h1,number theory,modular arithmetic,A,0.0,1.0,B,0.85,B,0.95,,,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_modular_h2,number theory,modular arithmetic,A,0.0,1.0,B,0.85,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_modular_h3,number theory,modular arithmetic,A,1.0,0.85,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_primes_e1,number theory,primes,A,0.0,0.9,B,0.85,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_primes_e2,number theory,primes,A,1.0,0.95,A,0.85,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_primes_e3,number theory,primes,A,1.0,0.95,A,0.8,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_primes_m1,number theory,primes,B,0.0,0.85,A,0.85,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_primes_m2,number theory,primes,A,0.0,0.95,B,0.85,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_primes_m3,number theory,primes,A,1.0,0.85,B,0.9,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_primes_h1,number theory,primes,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_primes_h2,number theory,primes,A,1.0,1.0,A,0.98,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_primes_h3,number theory,primes,A,1.0,0.85,A,0.95,A,0.95,,,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_diophantine_e1,number theory,diophantine equations,B,1.0,0.95,B,0.95,B,0.95,B,0.9,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_diophantine_e2,number theory,diophantine equations,B,1.0,0.95,B,0.8,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_diophantine_e3,number theory,diophantine equations,B,1.0,0.95,B,0.9,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_diophantine_m1,number theory,diophantine equations,B,0.0,0.95,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_diophantine_m2,number theory,diophantine equations,A,0.0,0.95,A,0.85,B,0.95,B,1.0,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_diophantine_m3,number theory,diophantine equations,B,1.0,0.95,B,0.95,B,0.95,A,0.9,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_diophantine_h1,number theory,diophantine equations,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_diophantine_h2,number theory,diophantine equations,B,1.0,0.85,B,0.85,B,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_diophantine_h3,number theory,diophantine equations,A,0.0,0.85,A,0.65,B,0.85,B,0.85,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_sequences_e1,number theory,number sequences,A,1.0,0.95,A,0.95,A,0.98,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_sequences_e2,number theory,number sequences,A,1.0,0.95,A,1.0,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_sequences_e3,number theory,number sequences,B,0.0,0.95,A,0.95,A,0.95,A,0.9,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_sequences_m1,number theory,number sequences,A,1.0,0.85,A,0.95,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_sequences_m2,number theory,number sequences,A,0.0,0.95,A,0.85,B,0.98,,,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_sequences_m3,number theory,number sequences,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_sequences_h1,number theory,number sequences,A,0.0,0.85,B,0.95,B,0.95,B,0.85,A
DeepSeek-R1-Distill-Qwen-7B,numbertheory_sequences_h2,number theory,number sequences,A,1.0,1.0,A,0.85,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,numbertheory_sequences_h3,number theory,number sequences,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_counting_e1,combinatorics,counting principles,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_counting_e2,combinatorics,counting principles,A,1.0,0.9,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_counting_e3,combinatorics,counting principles,A,1.0,0.95,A,0.95,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_counting_m1,combinatorics,counting principles,A,1.0,0.95,A,0.85,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_counting_m2,combinatorics,counting principles,B,1.0,0.95,B,0.75,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_counting_m3,combinatorics,counting principles,B,0.0,0.95,A,0.9,A,0.98,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_counting_h1,combinatorics,counting principles,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_counting_h2,combinatorics,counting principles,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_counting_h3,combinatorics,counting principles,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_permutations_e1,combinatorics,permutations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_permutations_e2,combinatorics,permutations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_permutations_e3,combinatorics,permutations,B,0.0,0.95,A,0.95,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_permutations_m1,combinatorics,permutations,A,1.0,0.95,A,0.95,A,0.95,B,0.9,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_permutations_m2,combinatorics,permutations,A,1.0,0.95,A,0.95,A,0.98,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_permutations_m3,combinatorics,permutations,B,1.0,0.95,B,1.0,B,0.98,B,1.0,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_permutations_h1,combinatorics,permutations,A,0.0,1.0,B,0.85,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_permutations_h2,combinatorics,permutations,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_permutations_h3,combinatorics,permutations,B,1.0,0.5,B,0.8,B,0.85,A,0.6,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_combinations_e1,combinatorics,combinations,B,0.0,0.95,A,0.9,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_combinations_e2,combinatorics,combinations,A,0.0,0.95,B,0.95,B,0.98,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_combinations_e3,combinatorics,combinations,B,1.0,0.95,B,0.9,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_combinations_m1,combinatorics,combinations,A,0.0,0.95,B,0.9,B,0.98,,,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_combinations_m2,combinatorics,combinations,B,0.0,1.0,A,0.95,B,0.98,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_combinations_m3,combinatorics,combinations,A,1.0,1.0,A,0.85,A,0.95,B,1.0,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_combinations_h1,combinatorics,combinations,A,1.0,0.85,A,0.95,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_combinations_h2,combinatorics,combinations,A,0.0,0.95,A,0.95,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_combinations_h3,combinatorics,combinations,B,0.0,1.0,A,0.85,A,0.98,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_probability_e1,combinatorics,probability,B,1.0,0.95,B,0.95,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_probability_e2,combinatorics,probability,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_probability_e3,combinatorics,probability,A,1.0,0.85,A,0.85,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_probability_m1,combinatorics,probability,A,1.0,0.95,B,0.85,A,0.98,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_probability_m2,combinatorics,probability,B,0.0,0.95,A,0.95,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_probability_m3,combinatorics,probability,A,1.0,0.9,A,0.95,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_probability_h1,combinatorics,probability,A,1.0,0.85,A,0.85,A,0.95,,,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_probability_h2,combinatorics,probability,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_probability_h3,combinatorics,probability,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_recursion_e1,combinatorics,recursion,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_recursion_e2,combinatorics,recursion,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_recursion_e3,combinatorics,recursion,B,0.0,0.85,A,1.0,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_recursion_m1,combinatorics,recursion,B,0.0,0.95,A,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_recursion_m2,combinatorics,recursion,Tie,0.5,0.5,A,0.95,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_recursion_m3,combinatorics,recursion,B,0.0,0.95,A,0.75,B,0.75,A,0.9,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_recursion_h1,combinatorics,recursion,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,combinatorics_recursion_h2,combinatorics,recursion,A,0.0,0.95,B,0.9,B,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,combinatorics_recursion_h3,combinatorics,recursion,A,0.0,0.85,B,0.95,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,statistics_descriptive_e1,statistics,descriptive statistics,A,0.0,1.0,B,0.9,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,statistics_descriptive_e2,statistics,descriptive statistics,A,1.0,0.95,B,0.6,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,statistics_descriptive_e3,statistics,descriptive statistics,A,1.0,0.95,A,1.0,A,0.98,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,statistics_descriptive_m1,statistics,descriptive statistics,B,1.0,0.95,A,0.85,B,0.98,B,1.0,A
DeepSeek-R1-Distill-Qwen-7B,statistics_descriptive_m2,statistics,descriptive statistics,A,0.0,0.95,A,0.95,B,0.95,B,0.85,A
DeepSeek-R1-Distill-Qwen-7B,statistics_descriptive_m3,statistics,descriptive statistics,A,0.0,0.95,A,0.85,B,0.95,B,0.9,A
DeepSeek-R1-Distill-Qwen-7B,statistics_descriptive_h1,statistics,descriptive statistics,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,statistics_descriptive_h2,statistics,descriptive statistics,A,1.0,0.95,A,0.85,B,0.75,A,0.8,B
DeepSeek-R1-Distill-Qwen-7B,statistics_descriptive_h3,statistics,descriptive statistics,A,1.0,0.95,A,1.0,A,0.95,B,0.7,A
DeepSeek-R1-Distill-Qwen-7B,statistics_distributions_e1,statistics,distributions,A,1.0,0.85,A,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,statistics_distributions_e2,statistics,distributions,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,statistics_distributions_e3,statistics,distributions,B,0.0,0.95,A,0.85,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,statistics_distributions_m1,statistics,distributions,B,1.0,0.95,B,0.95,B,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,statistics_distributions_m2,statistics,distributions,A,1.0,0.85,A,0.9,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,statistics_distributions_m3,statistics,distributions,A,1.0,0.95,A,1.0,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,statistics_distributions_h1,statistics,distributions,A,1.0,0.85,A,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,statistics_distributions_h2,statistics,distributions,A,1.0,0.95,A,0.8,B,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,statistics_distributions_h3,statistics,distributions,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,statistics_hypothesis_e1,statistics,hypothesis testing,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,statistics_hypothesis_e2,statistics,hypothesis testing,A,1.0,0.85,A,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,statistics_hypothesis_e3,statistics,hypothesis testing,B,0.0,0.85,B,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,statistics_hypothesis_m1,statistics,hypothesis testing,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,statistics_hypothesis_m2,statistics,hypothesis testing,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,statistics_hypothesis_m3,statistics,hypothesis testing,B,1.0,0.95,B,0.95,B,0.9,B,0.75,B
DeepSeek-R1-Distill-Qwen-7B,statistics_hypothesis_h1,statistics,hypothesis testing,A,0.0,0.95,B,0.85,B,0.95,B,0.9,B
DeepSeek-R1-Distill-Qwen-7B,statistics_hypothesis_h2,statistics,hypothesis testing,A,1.0,0.95,A,0.85,A,0.95,B,0.9,A
DeepSeek-R1-Distill-Qwen-7B,statistics_hypothesis_h3,statistics,hypothesis testing,B,0.0,0.95,A,0.9,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,statistics_regression_e1,statistics,regression,A,0.0,0.95,B,0.95,B,0.95,,,B
DeepSeek-R1-Distill-Qwen-7B,statistics_regression_e2,statistics,regression,B,1.0,0.85,A,0.85,B,0.95,B,0.9,A
DeepSeek-R1-Distill-Qwen-7B,statistics_regression_e3,statistics,regression,B,0.0,0.95,A,0.95,A,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,statistics_regression_m1,statistics,regression,B,0.0,0.95,B,0.95,A,0.95,A,0.9,A
DeepSeek-R1-Distill-Qwen-7B,statistics_regression_m2,statistics,regression,A,0.0,1.0,B,0.85,B,0.95,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,statistics_regression_m3,statistics,regression,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,statistics_regression_h1,statistics,regression,A,1.0,0.95,A,0.95,A,0.95,B,1.0,A
DeepSeek-R1-Distill-Qwen-7B,statistics_regression_h2,statistics,regression,B,0.0,0.95,A,0.85,B,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,statistics_regression_h3,statistics,regression,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,statistics_bayesian_e1,statistics,bayesian inference,A,1.0,0.95,A,0.8,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,statistics_bayesian_e2,statistics,bayesian inference,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,statistics_bayesian_e3,statistics,bayesian inference,A,1.0,0.95,A,0.95,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,statistics_bayesian_m1,statistics,bayesian inference,B,0.0,0.95,A,0.95,A,0.98,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,statistics_bayesian_m2,statistics,bayesian inference,B,1.0,0.95,B,0.85,B,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,statistics_bayesian_m3,statistics,bayesian inference,B,0.0,1.0,A,0.85,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,statistics_bayesian_h1,statistics,bayesian inference,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,statistics_bayesian_h2,statistics,bayesian inference,A,1.0,0.85,A,0.95,A,0.9,A,0.9,A
DeepSeek-R1-Distill-Qwen-7B,statistics_bayesian_h3,statistics,bayesian inference,B,0.0,0.95,A,0.85,B,0.98,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_matrices_e1,linear algebra,matrices,A,0.0,0.9,B,0.95,B,0.95,A,1.0,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_matrices_e2,linear algebra,matrices,A,1.0,0.95,A,0.95,A,0.9,B,1.0,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_matrices_e3,linear algebra,matrices,A,1.0,0.95,A,0.95,B,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_matrices_m1,linear algebra,matrices,A,1.0,0.95,B,0.9,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_matrices_m2,linear algebra,matrices,B,0.0,0.95,B,0.95,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_matrices_m3,linear algebra,matrices,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_matrices_h1,linear algebra,matrices,B,0.0,0.95,A,0.85,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_matrices_h2,linear algebra,matrices,B,0.0,0.95,B,0.55,A,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_matrices_h3,linear algebra,matrices,A,0.0,0.95,B,0.85,B,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_determinants_e1,linear algebra,determinants,B,1.0,0.9,B,0.9,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_determinants_e2,linear algebra,determinants,B,0.0,0.95,A,0.9,A,0.95,B,0.9,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_determinants_e3,linear algebra,determinants,A,1.0,1.0,A,0.95,A,0.95,B,0.85,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_determinants_m1,linear algebra,determinants,B,0.0,0.95,A,0.95,B,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_determinants_m2,linear algebra,determinants,B,1.0,0.85,B,0.9,B,0.95,,,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_determinants_m3,linear algebra,determinants,A,1.0,1.0,A,0.95,A,0.95,B,0.95,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_determinants_h1,linear algebra,determinants,A,1.0,0.95,A,0.98,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_determinants_h2,linear algebra,determinants,A,0.0,0.95,A,0.9,B,0.95,,,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_determinants_h3,linear algebra,determinants,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_vectorspaces_e1,linear algebra,vector spaces,A,1.0,0.95,A,0.95,A,0.98,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_vectorspaces_e2,linear algebra,vector spaces,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_vectorspaces_e3,linear algebra,vector spaces,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_vectorspaces_m1,linear algebra,vector spaces,A,0.0,0.95,B,0.75,B,0.95,,,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_vectorspaces_m2,linear algebra,vector spaces,B,0.0,0.95,A,0.85,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_vectorspaces_m3,linear algebra,vector spaces,B,0.0,0.95,B,0.8,A,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_vectorspaces_h1,linear algebra,vector spaces,B,1.0,0.95,B,0.85,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_vectorspaces_h2,linear algebra,vector spaces,A,1.0,0.85,A,0.6,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_vectorspaces_h3,linear algebra,vector spaces,B,0.0,0.95,A,0.85,A,0.92,B,0.85,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_eigenvalues_e1,linear algebra,eigenvalues,B,0.0,0.95,A,0.85,A,0.98,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_eigenvalues_e2,linear algebra,eigenvalues,B,0.0,0.95,A,0.85,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_eigenvalues_e3,linear algebra,eigenvalues,B,0.0,0.95,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_eigenvalues_m1,linear algebra,eigenvalues,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_eigenvalues_m2,linear algebra,eigenvalues,A,1.0,0.9,A,0.85,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_eigenvalues_m3,linear algebra,eigenvalues,A,1.0,0.95,A,0.75,B,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_eigenvalues_h1,linear algebra,eigenvalues,A,1.0,0.95,B,0.85,A,0.95,,,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_eigenvalues_h2,linear algebra,eigenvalues,B,0.0,0.85,A,0.85,A,0.95,B,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_eigenvalues_h3,linear algebra,eigenvalues,A,0.0,1.0,B,0.85,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_transformations_e1,linear algebra,linear transformations,A,1.0,0.85,A,0.95,A,0.95,B,1.0,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_transformations_e2,linear algebra,linear transformations,Tie,0.5,0.5,A,0.85,B,0.95,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_transformations_e3,linear algebra,linear transformations,B,1.0,0.95,B,0.95,B,0.95,A,0.95,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_transformations_m1,linear algebra,linear transformations,B,0.0,0.95,A,0.95,B,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_transformations_m2,linear algebra,linear transformations,B,0.0,0.85,A,0.9,A,0.98,A,1.0,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_transformations_m3,linear algebra,linear transformations,B,1.0,0.95,A,0.85,B,0.98,,,A
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_transformations_h1,linear algebra,linear transformations,Tie,0.5,0.5,A,0.95,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_transformations_h2,linear algebra,linear transformations,B,0.0,0.9,A,0.9,A,0.95,A,0.95,B
DeepSeek-R1-Distill-Qwen-7B,linearalgebra_transformations_h3,linear algebra,linear transformations,A,1.0,0.95,A,1.0,A,0.95,A,1.0,A
Bespoke-Stratos-7B,arithmetic_basic_operations_e1,arithmetic,basic operations,B,0.0,0.95,A,0.85,A,0.95,B,0.95,A
Bespoke-Stratos-7B,arithmetic_basic_operations_e2,arithmetic,basic operations,A,0.0,0.95,B,0.95,B,0.95,A,0.95,A
Bespoke-Stratos-7B,arithmetic_basic_operations_e3,arithmetic,basic operations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Bespoke-Stratos-7B,arithmetic_basic_operations_m1,arithmetic,basic operations,A,1.0,0.95,A,0.95,A,0.95,A,0.9,B
Bespoke-Stratos-7B,arithmetic_basic_operations_m2,arithmetic,basic operations,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Bespoke-Stratos-7B,arithmetic_basic_operations_m3,arithmetic,basic operations,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,arithmetic_basic_operations_h1,arithmetic,basic operations,B,1.0,0.95,B,0.95,B,0.98,B,0.95,A
Bespoke-Stratos-7B,arithmetic_basic_operations_h2,arithmetic,basic operations,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,arithmetic_basic_operations_h3,arithmetic,basic operations,B,1.0,0.95,B,0.9,B,0.95,A,0.9,A
Bespoke-Stratos-7B,arithmetic_fractions_e1,arithmetic,fractions,A,0.0,0.95,B,0.95,B,0.98,B,0.95,B
Bespoke-Stratos-7B,arithmetic_fractions_e2,arithmetic,fractions,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,arithmetic_fractions_e3,arithmetic,fractions,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,arithmetic_fractions_m1,arithmetic,fractions,B,1.0,0.95,B,0.95,B,0.95,A,0.95,B
Bespoke-Stratos-7B,arithmetic_fractions_m2,arithmetic,fractions,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,arithmetic_fractions_m3,arithmetic,fractions,A,0.0,0.95,A,0.85,B,0.95,B,0.95,A
Bespoke-Stratos-7B,arithmetic_fractions_h1,arithmetic,fractions,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,arithmetic_fractions_h2,arithmetic,fractions,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,arithmetic_fractions_h3,arithmetic,fractions,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Bespoke-Stratos-7B,arithmetic_percentages_e1,arithmetic,percentages,B,1.0,0.95,B,0.95,B,0.98,B,0.95,A
Bespoke-Stratos-7B,arithmetic_percentages_e2,arithmetic,percentages,A,0.0,0.95,B,0.85,B,0.95,A,0.95,A
Bespoke-Stratos-7B,arithmetic_percentages_e3,arithmetic,percentages,A,0.0,0.95,B,0.95,B,0.9,B,0.95,B
Bespoke-Stratos-7B,arithmetic_percentages_m1,arithmetic,percentages,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,arithmetic_percentages_m2,arithmetic,percentages,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,arithmetic_percentages_m3,arithmetic,percentages,B,1.0,0.95,B,0.95,B,0.98,A,0.95,A
Bespoke-Stratos-7B,arithmetic_percentages_h1,arithmetic,percentages,A,0.0,0.95,B,0.9,A,0.95,B,0.9,A
Bespoke-Stratos-7B,arithmetic_percentages_h2,arithmetic,percentages,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,arithmetic_percentages_h3,arithmetic,percentages,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Bespoke-Stratos-7B,arithmetic_numerical_e1,arithmetic,numerical approximation,B,1.0,0.95,B,0.85,B,0.95,A,0.95,B
Bespoke-Stratos-7B,arithmetic_numerical_e2,arithmetic,numerical approximation,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,arithmetic_numerical_e3,arithmetic,numerical approximation,A,0.0,0.95,B,1.0,B,0.95,B,1.0,B
Bespoke-Stratos-7B,arithmetic_numerical_m1,arithmetic,numerical approximation,B,1.0,0.85,B,0.95,B,0.95,A,0.95,A
Bespoke-Stratos-7B,arithmetic_numerical_m2,arithmetic,numerical approximation,B,1.0,0.95,B,0.85,B,0.95,B,0.95,A
Bespoke-Stratos-7B,arithmetic_numerical_m3,arithmetic,numerical approximation,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
Bespoke-Stratos-7B,arithmetic_numerical_h1,arithmetic,numerical approximation,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,arithmetic_numerical_h2,arithmetic,numerical approximation,B,1.0,0.95,B,0.95,B,0.9,B,0.95,A
Bespoke-Stratos-7B,arithmetic_numerical_h3,arithmetic,numerical approximation,B,0.0,0.95,B,0.9,A,0.95,A,0.95,A
Bespoke-Stratos-7B,arithmetic_order_e1,arithmetic,order of operations,A,0.0,0.95,B,0.85,B,0.95,A,0.9,B
Bespoke-Stratos-7B,arithmetic_order_e2,arithmetic,order of operations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,arithmetic_order_e3,arithmetic,order of operations,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Bespoke-Stratos-7B,arithmetic_order_m1,arithmetic,order of operations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,arithmetic_order_m2,arithmetic,order of operations,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Bespoke-Stratos-7B,arithmetic_order_m3,arithmetic,order of operations,A,1.0,0.95,A,0.9,A,0.95,B,0.95,A
Bespoke-Stratos-7B,arithmetic_order_h1,arithmetic,order of operations,B,0.0,0.98,A,0.95,A,0.98,A,0.95,A
Bespoke-Stratos-7B,arithmetic_order_h2,arithmetic,order of operations,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
Bespoke-Stratos-7B,arithmetic_order_h3,arithmetic,order of operations,A,0.0,0.95,B,0.95,B,0.98,B,0.95,B
Bespoke-Stratos-7B,algebra_equations_e1,algebra,equations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,algebra_equations_e2,algebra,equations,B,0.0,0.95,A,0.95,A,0.95,A,1.0,A
Bespoke-Stratos-7B,algebra_equations_e3,algebra,equations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,algebra_equations_m1,algebra,equations,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
Bespoke-Stratos-7B,algebra_equations_m2,algebra,equations,A,0.0,0.95,B,0.9,B,0.95,B,0.9,B
Bespoke-Stratos-7B,algebra_equations_m3,algebra,equations,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
Bespoke-Stratos-7B,algebra_equations_h1,algebra,equations,A,0.0,0.95,B,0.85,B,0.95,B,1.0,B
Bespoke-Stratos-7B,algebra_equations_h2,algebra,equations,A,1.0,0.95,A,0.98,A,0.98,A,0.95,A
Bespoke-Stratos-7B,algebra_equations_h3,algebra,equations,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
Bespoke-Stratos-7B,algebra_inequalities_e1,algebra,inequalities,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,algebra_inequalities_e2,algebra,inequalities,A,1.0,0.95,B,0.9,A,0.95,A,0.95,A
Bespoke-Stratos-7B,algebra_inequalities_e3,algebra,inequalities,A,0.0,0.85,B,0.85,B,0.95,B,1.0,A
Bespoke-Stratos-7B,algebra_inequalities_m1,algebra,inequalities,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Bespoke-Stratos-7B,algebra_inequalities_m2,algebra,inequalities,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
Bespoke-Stratos-7B,algebra_inequalities_m3,algebra,inequalities,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,algebra_inequalities_h1,algebra,inequalities,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
Bespoke-Stratos-7B,algebra_inequalities_h2,algebra,inequalities,A,0.0,0.95,B,1.0,B,0.95,B,1.0,A
Bespoke-Stratos-7B,algebra_inequalities_h3,algebra,inequalities,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Bespoke-Stratos-7B,algebra_polynomials_e1,algebra,polynomials,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,algebra_polynomials_e2,algebra,polynomials,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,algebra_polynomials_e3,algebra,polynomials,A,0.0,0.95,B,0.9,A,0.95,B,0.95,B
Bespoke-Stratos-7B,algebra_polynomials_m1,algebra,polynomials,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,algebra_polynomials_m2,algebra,polynomials,A,1.0,0.95,A,0.85,B,0.95,A,0.95,B
Bespoke-Stratos-7B,algebra_polynomials_m3,algebra,polynomials,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,algebra_polynomials_h1,algebra,polynomials,B,1.0,0.95,B,0.9,B,0.95,B,0.95,B
Bespoke-Stratos-7B,algebra_polynomials_h2,algebra,polynomials,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,algebra_polynomials_h3,algebra,polynomials,B,0.0,0.5,B,0.85,A,0.92,A,0.95,A
Bespoke-Stratos-7B,algebra_functions_e1,algebra,functions,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,algebra_functions_e2,algebra,functions,A,1.0,0.95,A,0.95,A,0.98,A,0.95,A
Bespoke-Stratos-7B,algebra_functions_e3,algebra,functions,A,1.0,0.95,A,0.98,A,0.95,A,0.95,A
Bespoke-Stratos-7B,algebra_functions_m1,algebra,functions,B,1.0,0.95,B,0.95,B,0.98,B,0.95,A
Bespoke-Stratos-7B,algebra_functions_m2,algebra,functions,B,0.0,0.95,A,0.75,A,0.95,B,1.0,A
Bespoke-Stratos-7B,algebra_functions_m3,algebra,functions,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
Bespoke-Stratos-7B,algebra_functions_h1,algebra,functions,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,algebra_functions_h2,algebra,functions,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,algebra_functions_h3,algebra,functions,A,0.0,0.95,B,0.95,A,0.95,B,0.9,B
Bespoke-Stratos-7B,algebra_systems_e1,algebra,systems of equations,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,algebra_systems_e2,algebra,systems of equations,A,1.0,0.95,A,0.95,A,0.98,A,0.95,A
Bespoke-Stratos-7B,algebra_systems_e3,algebra,systems of equations,A,0.0,0.95,B,0.95,B,0.98,B,0.95,B
Bespoke-Stratos-7B,algebra_systems_m1,algebra,systems of equations,B,1.0,0.95,B,1.0,B,0.98,B,0.95,B
Bespoke-Stratos-7B,algebra_systems_m2,algebra,systems of equations,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
Bespoke-Stratos-7B,algebra_systems_m3,algebra,systems of equations,A,1.0,0.95,B,0.85,A,0.98,A,0.95,A
Bespoke-Stratos-7B,algebra_systems_h1,algebra,systems of equations,A,1.0,0.95,A,0.85,A,0.95,B,0.9,A
Bespoke-Stratos-7B,algebra_systems_h2,algebra,systems of equations,A,0.0,0.95,B,0.9,A,0.95,B,0.95,A
Bespoke-Stratos-7B,algebra_systems_h3,algebra,systems of equations,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_differentiation_e1,calculus,differentiation,A,1.0,0.9,A,0.9,A,0.95,B,0.95,A
Bespoke-Stratos-7B,calculus_differentiation_e2,calculus,differentiation,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_differentiation_e3,calculus,differentiation,B,1.0,0.95,B,0.95,B,0.99,B,0.95,B
Bespoke-Stratos-7B,calculus_differentiation_m1,calculus,differentiation,B,1.0,0.85,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,calculus_differentiation_m2,calculus,differentiation,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Bespoke-Stratos-7B,calculus_differentiation_m3,calculus,differentiation,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Bespoke-Stratos-7B,calculus_differentiation_h1,calculus,differentiation,A,1.0,0.95,A,0.95,B,0.95,A,0.95,B
Bespoke-Stratos-7B,calculus_differentiation_h2,calculus,differentiation,B,1.0,0.95,B,0.85,A,0.95,B,0.9,A
Bespoke-Stratos-7B,calculus_differentiation_h3,calculus,differentiation,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,calculus_integration_e1,calculus,integration,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_integration_e2,calculus,integration,B,1.0,0.95,B,0.95,B,0.98,B,0.95,A
Bespoke-Stratos-7B,calculus_integration_e3,calculus,integration,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_integration_m1,calculus,integration,B,1.0,0.95,B,0.95,B,0.98,B,0.95,B
Bespoke-Stratos-7B,calculus_integration_m2,calculus,integration,A,1.0,0.95,A,0.9,A,0.95,A,0.9,B
Bespoke-Stratos-7B,calculus_integration_m3,calculus,integration,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_integration_h1,calculus,integration,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_integration_h2,calculus,integration,A,0.0,0.95,B,0.85,B,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_integration_h3,calculus,integration,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,calculus_limits_e1,calculus,limits,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_limits_e2,calculus,limits,A,1.0,0.95,A,0.85,A,0.95,B,0.95,A
Bespoke-Stratos-7B,calculus_limits_e3,calculus,limits,A,0.0,0.95,B,0.9,B,0.95,A,0.8,B
Bespoke-Stratos-7B,calculus_limits_m1,calculus,limits,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
Bespoke-Stratos-7B,calculus_limits_m2,calculus,limits,A,0.0,0.95,B,0.95,A,0.95,B,1.0,A
Bespoke-Stratos-7B,calculus_limits_m3,calculus,limits,A,0.0,0.95,B,0.85,B,0.95,B,0.9,A
Bespoke-Stratos-7B,calculus_limits_h1,calculus,limits,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,calculus_limits_h2,calculus,limits,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_limits_h3,calculus,limits,A,1.0,0.95,B,0.85,A,0.9,A,0.95,B
Bespoke-Stratos-7B,calculus_series_e1,calculus,series,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,calculus_series_e2,calculus,series,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
Bespoke-Stratos-7B,calculus_series_e3,calculus,series,B,0.0,0.95,B,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_series_m1,calculus,series,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,calculus_series_m2,calculus,series,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_series_m3,calculus,series,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_series_h1,calculus,series,B,1.0,1.0,B,1.0,B,0.95,B,0.95,B
Bespoke-Stratos-7B,calculus_series_h2,calculus,series,A,1.0,0.95,A,0.95,A,0.95,B,0.9,B
Bespoke-Stratos-7B,calculus_series_h3,calculus,series,B,1.0,0.95,B,0.85,A,0.95,B,0.9,A
Bespoke-Stratos-7B,calculus_applications_e1,calculus,applications,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_applications_e2,calculus,applications,B,1.0,0.95,B,0.85,B,0.95,A,0.95,B
Bespoke-Stratos-7B,calculus_applications_e3,calculus,applications,B,0.0,0.95,B,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_applications_m1,calculus,applications,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Bespoke-Stratos-7B,calculus_applications_m2,calculus,applications,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_applications_m3,calculus,applications,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Bespoke-Stratos-7B,calculus_applications_h1,calculus,applications,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,calculus_applications_h2,calculus,applications,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Bespoke-Stratos-7B,calculus_applications_h3,calculus,applications,B,0.0,0.95,A,0.95,A,0.85,A,0.95,B
Bespoke-Stratos-7B,geometry_plane_e1,geometry,plane geometry,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,geometry_plane_e2,geometry,plane geometry,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,geometry_plane_e3,geometry,plane geometry,B,1.0,0.85,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,geometry_plane_m1,geometry,plane geometry,A,0.0,0.95,B,0.85,B,0.95,B,0.95,A
Bespoke-Stratos-7B,geometry_plane_m2,geometry,plane geometry,B,0.0,0.95,A,0.95,A,0.95,A,0.9,A
Bespoke-Stratos-7B,geometry_plane_m3,geometry,plane geometry,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Bespoke-Stratos-7B,geometry_plane_h1,geometry,plane geometry,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Bespoke-Stratos-7B,geometry_plane_h2,geometry,plane geometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,geometry_plane_h3,geometry,plane geometry,A,0.0,0.95,B,0.95,B,0.98,B,0.95,A
Bespoke-Stratos-7B,geometry_coordinate_e1,geometry,coordinate geometry,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Bespoke-Stratos-7B,geometry_coordinate_e2,geometry,coordinate geometry,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,geometry_coordinate_e3,geometry,coordinate geometry,A,0.0,0.95,B,0.9,B,0.95,A,1.0,B
Bespoke-Stratos-7B,geometry_coordinate_m1,geometry,coordinate geometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,geometry_coordinate_m2,geometry,coordinate geometry,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,geometry_coordinate_m3,geometry,coordinate geometry,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Bespoke-Stratos-7B,geometry_coordinate_h1,geometry,coordinate geometry,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
Bespoke-Stratos-7B,geometry_coordinate_h2,geometry,coordinate geometry,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,geometry_coordinate_h3,geometry,coordinate geometry,B,1.0,0.95,B,0.98,B,0.95,B,1.0,B
Bespoke-Stratos-7B,geometry_transformations_e1,geometry,transformations,A,1.0,0.95,B,0.95,A,0.98,A,0.95,B
Bespoke-Stratos-7B,geometry_transformations_e2,geometry,transformations,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Bespoke-Stratos-7B,geometry_transformations_e3,geometry,transformations,B,1.0,0.95,B,0.9,B,0.95,A,1.0,B
Bespoke-Stratos-7B,geometry_transformations_m1,geometry,transformations,B,1.0,0.95,B,0.98,B,0.95,B,0.95,B
Bespoke-Stratos-7B,geometry_transformations_m2,geometry,transformations,B,1.0,0.85,B,0.95,B,0.95,B,1.0,B
Bespoke-Stratos-7B,geometry_transformations_m3,geometry,transformations,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,geometry_transformations_h1,geometry,transformations,A,1.0,0.95,A,0.95,A,0.98,A,0.95,B
Bespoke-Stratos-7B,geometry_transformations_h2,geometry,transformations,B,1.0,0.75,B,0.85,A,0.85,B,0.95,A
Bespoke-Stratos-7B,geometry_transformations_h3,geometry,transformations,A,1.0,0.95,A,0.95,A,0.95,A,0.8,B
Bespoke-Stratos-7B,geometry_mensuration_e1,geometry,mensuration,A,0.0,0.95,B,0.9,B,0.95,A,0.95,B
Bespoke-Stratos-7B,geometry_mensuration_e2,geometry,mensuration,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
Bespoke-Stratos-7B,geometry_mensuration_e3,geometry,mensuration,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,geometry_mensuration_m1,geometry,mensuration,A,1.0,0.95,A,0.98,A,0.95,A,0.95,A
Bespoke-Stratos-7B,geometry_mensuration_m2,geometry,mensuration,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,geometry_mensuration_m3,geometry,mensuration,A,0.0,0.95,B,0.95,B,0.98,B,0.95,B
Bespoke-Stratos-7B,geometry_mensuration_h1,geometry,mensuration,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,geometry_mensuration_h2,geometry,mensuration,A,0.0,0.9,A,0.85,B,0.75,B,0.85,B
Bespoke-Stratos-7B,geometry_mensuration_h3,geometry,mensuration,B,1.0,0.75,B,0.65,B,0.65,B,0.8,A
Bespoke-Stratos-7B,geometry_trigonometry_e1,geometry,trigonometry,B,1.0,0.95,B,0.95,B,0.95,A,0.95,B
Bespoke-Stratos-7B,geometry_trigonometry_e2,geometry,trigonometry,A,0.0,0.95,B,0.9,B,0.95,B,0.9,B
Bespoke-Stratos-7B,geometry_trigonometry_e3,geometry,trigonometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,geometry_trigonometry_m1,geometry,trigonometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,geometry_trigonometry_m2,geometry,trigonometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,geometry_trigonometry_m3,geometry,trigonometry,B,1.0,0.95,B,0.98,B,0.98,B,0.95,B
Bespoke-Stratos-7B,geometry_trigonometry_h1,geometry,trigonometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,geometry_trigonometry_h2,geometry,trigonometry,B,0.0,0.85,A,0.65,A,0.85,A,0.8,A
Bespoke-Stratos-7B,geometry_trigonometry_h3,geometry,trigonometry,B,1.0,0.85,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,numbertheory_divisibility_e1,number theory,divisibility,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,numbertheory_divisibility_e2,number theory,divisibility,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Bespoke-Stratos-7B,numbertheory_divisibility_e3,number theory,divisibility,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
Bespoke-Stratos-7B,numbertheory_divisibility_m1,number theory,divisibility,A,1.0,0.95,A,0.85,A,0.95,B,0.95,A
Bespoke-Stratos-7B,numbertheory_divisibility_m2,number theory,divisibility,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
Bespoke-Stratos-7B,numbertheory_divisibility_m3,number theory,divisibility,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,numbertheory_divisibility_h1,number theory,divisibility,A,1.0,0.95,A,0.9,A,0.95,A,0.9,A
Bespoke-Stratos-7B,numbertheory_divisibility_h2,number theory,divisibility,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
Bespoke-Stratos-7B,numbertheory_divisibility_h3,number theory,divisibility,A,1.0,0.95,A,0.85,B,0.95,A,1.0,B
Bespoke-Stratos-7B,numbertheory_modular_e1,number theory,modular arithmetic,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,numbertheory_modular_e2,number theory,modular arithmetic,B,1.0,0.9,B,0.85,B,0.95,A,0.95,B
Bespoke-Stratos-7B,numbertheory_modular_e3,number theory,modular arithmetic,A,0.0,0.95,B,0.95,B,0.95,B,0.9,B
Bespoke-Stratos-7B,numbertheory_modular_m1,number theory,modular arithmetic,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,numbertheory_modular_m2,number theory,modular arithmetic,A,0.0,0.95,B,0.9,B,0.95,A,0.95,B
Bespoke-Stratos-7B,numbertheory_modular_m3,number theory,modular arithmetic,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Bespoke-Stratos-7B,numbertheory_modular_h1,number theory,modular arithmetic,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,numbertheory_modular_h2,number theory,modular arithmetic,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,numbertheory_modular_h3,number theory,modular arithmetic,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,numbertheory_primes_e1,number theory,primes,A,1.0,0.95,A,0.85,A,0.95,B,0.95,A
Bespoke-Stratos-7B,numbertheory_primes_e2,number theory,primes,A,0.0,0.95,B,0.85,B,0.95,A,0.9,B
Bespoke-Stratos-7B,numbertheory_primes_e3,number theory,primes,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,numbertheory_primes_m1,number theory,primes,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,numbertheory_primes_m2,number theory,primes,B,1.0,0.95,B,1.0,B,0.98,B,0.95,B
Bespoke-Stratos-7B,numbertheory_primes_m3,number theory,primes,B,0.0,0.85,A,0.85,A,0.95,A,0.95,B
Bespoke-Stratos-7B,numbertheory_primes_h1,number theory,primes,B,1.0,0.95,B,0.85,A,0.95,B,0.9,A
Bespoke-Stratos-7B,numbertheory_primes_h2,number theory,primes,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
Bespoke-Stratos-7B,numbertheory_primes_h3,number theory,primes,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,numbertheory_diophantine_e1,number theory,diophantine equations,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,numbertheory_diophantine_e2,number theory,diophantine equations,A,0.0,0.85,B,0.9,A,0.95,B,0.95,A
Bespoke-Stratos-7B,numbertheory_diophantine_e3,number theory,diophantine equations,B,1.0,0.95,B,0.95,B,0.99,B,1.0,B
Bespoke-Stratos-7B,numbertheory_diophantine_m1,number theory,diophantine equations,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Bespoke-Stratos-7B,numbertheory_diophantine_m2,number theory,diophantine equations,A,0.0,0.95,B,0.9,B,0.95,A,0.95,A
Bespoke-Stratos-7B,numbertheory_diophantine_m3,number theory,diophantine equations,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Bespoke-Stratos-7B,numbertheory_diophantine_h1,number theory,diophantine equations,B,1.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,numbertheory_diophantine_h2,number theory,diophantine equations,A,0.0,0.85,B,0.9,A,0.95,B,0.95,A
Bespoke-Stratos-7B,numbertheory_diophantine_h3,number theory,diophantine equations,A,1.0,0.95,B,0.85,A,0.9,A,0.95,A
Bespoke-Stratos-7B,numbertheory_sequences_e1,number theory,number sequences,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Bespoke-Stratos-7B,numbertheory_sequences_e2,number theory,number sequences,A,1.0,0.95,A,0.9,A,0.95,A,1.0,A
Bespoke-Stratos-7B,numbertheory_sequences_e3,number theory,number sequences,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,numbertheory_sequences_m1,number theory,number sequences,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Bespoke-Stratos-7B,numbertheory_sequences_m2,number theory,number sequences,A,1.0,0.95,A,0.85,A,0.95,B,0.95,A
Bespoke-Stratos-7B,numbertheory_sequences_m3,number theory,number sequences,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
Bespoke-Stratos-7B,numbertheory_sequences_h1,number theory,number sequences,A,0.0,0.95,B,0.95,B,0.95,A,0.95,A
Bespoke-Stratos-7B,numbertheory_sequences_h2,number theory,number sequences,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,numbertheory_sequences_h3,number theory,number sequences,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,combinatorics_counting_e1,combinatorics,counting principles,B,1.0,0.95,B,0.85,A,0.95,B,0.95,A
Bespoke-Stratos-7B,combinatorics_counting_e2,combinatorics,counting principles,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
Bespoke-Stratos-7B,combinatorics_counting_e3,combinatorics,counting principles,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,combinatorics_counting_m1,combinatorics,counting principles,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,combinatorics_counting_m2,combinatorics,counting principles,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Bespoke-Stratos-7B,combinatorics_counting_m3,combinatorics,counting principles,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Bespoke-Stratos-7B,combinatorics_counting_h1,combinatorics,counting principles,A,1.0,0.95,A,1.0,A,0.98,A,0.95,A
Bespoke-Stratos-7B,combinatorics_counting_h2,combinatorics,counting principles,A,1.0,1.0,A,0.95,A,0.98,A,0.95,B
Bespoke-Stratos-7B,combinatorics_counting_h3,combinatorics,counting principles,A,1.0,1.0,A,0.85,A,0.85,A,0.8,A
Bespoke-Stratos-7B,combinatorics_permutations_e1,combinatorics,permutations,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Bespoke-Stratos-7B,combinatorics_permutations_e2,combinatorics,permutations,A,1.0,0.95,A,0.85,B,0.95,A,0.95,B
Bespoke-Stratos-7B,combinatorics_permutations_e3,combinatorics,permutations,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Bespoke-Stratos-7B,combinatorics_permutations_m1,combinatorics,permutations,A,1.0,0.95,A,0.85,A,0.98,A,1.0,B
Bespoke-Stratos-7B,combinatorics_permutations_m2,combinatorics,permutations,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,combinatorics_permutations_m3,combinatorics,permutations,A,1.0,0.95,A,0.85,A,0.95,B,1.0,B
Bespoke-Stratos-7B,combinatorics_permutations_h1,combinatorics,permutations,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
Bespoke-Stratos-7B,combinatorics_permutations_h2,combinatorics,permutations,A,0.0,1.0,B,0.95,B,0.98,A,0.95,A
Bespoke-Stratos-7B,combinatorics_permutations_h3,combinatorics,permutations,A,0.0,0.85,B,0.7,A,0.95,B,0.7,B
Bespoke-Stratos-7B,combinatorics_combinations_e1,combinatorics,combinations,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Bespoke-Stratos-7B,combinatorics_combinations_e2,combinatorics,combinations,B,1.0,0.95,B,0.95,B,0.98,B,0.95,A
Bespoke-Stratos-7B,combinatorics_combinations_e3,combinatorics,combinations,A,1.0,0.95,B,0.75,A,0.95,A,0.95,B
Bespoke-Stratos-7B,combinatorics_combinations_m1,combinatorics,combinations,B,1.0,0.95,B,0.9,B,0.95,B,0.95,B
Bespoke-Stratos-7B,combinatorics_combinations_m2,combinatorics,combinations,A,1.0,0.95,A,1.0,A,0.99,A,1.0,A
Bespoke-Stratos-7B,combinatorics_combinations_m3,combinatorics,combinations,A,0.0,0.95,B,0.9,B,0.95,A,0.95,B
Bespoke-Stratos-7B,combinatorics_combinations_h1,combinatorics,combinations,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
Bespoke-Stratos-7B,combinatorics_combinations_h2,combinatorics,combinations,A,1.0,0.95,A,0.95,A,0.95,B,0.95,A
Bespoke-Stratos-7B,combinatorics_combinations_h3,combinatorics,combinations,A,1.0,0.95,A,0.9,A,0.95,A,0.95,B
Bespoke-Stratos-7B,combinatorics_probability_e1,combinatorics,probability,A,1.0,0.95,A,0.95,A,0.95,B,0.95,A
Bespoke-Stratos-7B,combinatorics_probability_e2,combinatorics,probability,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,combinatorics_probability_e3,combinatorics,probability,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,combinatorics_probability_m1,combinatorics,probability,A,0.0,0.95,A,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,combinatorics_probability_m2,combinatorics,probability,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
Bespoke-Stratos-7B,combinatorics_probability_m3,combinatorics,probability,B,1.0,0.95,B,0.9,A,0.95,B,1.0,A
Bespoke-Stratos-7B,combinatorics_probability_h1,combinatorics,probability,A,0.0,0.95,B,0.98,B,0.95,B,1.0,A
Bespoke-Stratos-7B,combinatorics_probability_h2,combinatorics,probability,B,1.0,0.95,B,1.0,B,0.95,B,0.95,B
Bespoke-Stratos-7B,combinatorics_probability_h3,combinatorics,probability,B,1.0,0.85,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,combinatorics_recursion_e1,combinatorics,recursion,B,0.0,0.95,A,0.9,A,0.9,A,0.9,A
Bespoke-Stratos-7B,combinatorics_recursion_e2,combinatorics,recursion,B,0.0,0.95,B,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,combinatorics_recursion_e3,combinatorics,recursion,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,combinatorics_recursion_m1,combinatorics,recursion,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Bespoke-Stratos-7B,combinatorics_recursion_m2,combinatorics,recursion,A,0.0,0.95,B,0.95,B,0.95,B,1.0,B
Bespoke-Stratos-7B,combinatorics_recursion_m3,combinatorics,recursion,B,1.0,0.95,B,0.95,B,0.95,B,1.0,B
Bespoke-Stratos-7B,combinatorics_recursion_h1,combinatorics,recursion,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,combinatorics_recursion_h2,combinatorics,recursion,B,1.0,0.95,B,0.95,B,0.95,A,0.9,A
Bespoke-Stratos-7B,combinatorics_recursion_h3,combinatorics,recursion,B,1.0,0.95,B,0.95,B,0.92,B,0.9,B
Bespoke-Stratos-7B,statistics_descriptive_e1,statistics,descriptive statistics,B,1.0,0.95,B,0.95,B,0.95,B,0.9,B
Bespoke-Stratos-7B,statistics_descriptive_e2,statistics,descriptive statistics,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,statistics_descriptive_e3,statistics,descriptive statistics,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,statistics_descriptive_m1,statistics,descriptive statistics,A,1.0,0.95,A,0.98,A,0.9,A,0.95,A
Bespoke-Stratos-7B,statistics_descriptive_m2,statistics,descriptive statistics,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,statistics_descriptive_m3,statistics,descriptive statistics,B,1.0,0.85,B,0.95,B,0.75,B,0.9,A
Bespoke-Stratos-7B,statistics_descriptive_h1,statistics,descriptive statistics,A,1.0,0.85,A,0.95,A,0.95,A,1.0,A
Bespoke-Stratos-7B,statistics_descriptive_h2,statistics,descriptive statistics,B,1.0,0.85,B,0.9,B,0.85,A,0.7,B
Bespoke-Stratos-7B,statistics_descriptive_h3,statistics,descriptive statistics,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
Bespoke-Stratos-7B,statistics_distributions_e1,statistics,distributions,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,statistics_distributions_e2,statistics,distributions,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,statistics_distributions_e3,statistics,distributions,B,0.0,0.95,A,0.85,A,0.95,A,1.0,B
Bespoke-Stratos-7B,statistics_distributions_m1,statistics,distributions,B,1.0,0.95,B,0.9,B,0.95,B,0.95,B
Bespoke-Stratos-7B,statistics_distributions_m2,statistics,distributions,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,statistics_distributions_m3,statistics,distributions,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,statistics_distributions_h1,statistics,distributions,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,statistics_distributions_h2,statistics,distributions,B,1.0,0.95,B,0.95,B,0.95,A,0.9,B
Bespoke-Stratos-7B,statistics_distributions_h3,statistics,distributions,A,0.0,0.95,A,0.9,B,0.95,B,0.95,B
Bespoke-Stratos-7B,statistics_hypothesis_e1,statistics,hypothesis testing,B,1.0,0.95,B,0.85,B,0.95,B,0.95,A
Bespoke-Stratos-7B,statistics_hypothesis_e2,statistics,hypothesis testing,A,1.0,0.95,B,0.8,A,0.95,A,0.95,B
Bespoke-Stratos-7B,statistics_hypothesis_e3,statistics,hypothesis testing,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,statistics_hypothesis_m1,statistics,hypothesis testing,A,0.0,0.95,B,0.85,A,0.95,B,0.9,B
Bespoke-Stratos-7B,statistics_hypothesis_m2,statistics,hypothesis testing,A,1.0,0.85,A,0.75,A,0.98,A,0.95,A
Bespoke-Stratos-7B,statistics_hypothesis_m3,statistics,hypothesis testing,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Bespoke-Stratos-7B,statistics_hypothesis_h1,statistics,hypothesis testing,A,0.0,0.95,B,0.95,B,0.95,B,0.9,A
Bespoke-Stratos-7B,statistics_hypothesis_h2,statistics,hypothesis testing,A,0.0,0.95,A,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,statistics_hypothesis_h3,statistics,hypothesis testing,A,1.0,0.95,A,0.98,A,0.95,A,1.0,A
Bespoke-Stratos-7B,statistics_regression_e1,statistics,regression,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,statistics_regression_e2,statistics,regression,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Bespoke-Stratos-7B,statistics_regression_e3,statistics,regression,A,0.0,0.95,B,0.85,B,0.9,B,0.9,B
Bespoke-Stratos-7B,statistics_regression_m1,statistics,regression,B,1.0,0.95,B,0.9,B,0.6,B,0.9,A
Bespoke-Stratos-7B,statistics_regression_m2,statistics,regression,A,0.0,0.95,B,0.9,B,0.95,A,0.95,B
Bespoke-Stratos-7B,statistics_regression_m3,statistics,regression,A,0.0,0.95,B,0.75,B,0.95,B,0.95,B
Bespoke-Stratos-7B,statistics_regression_h1,statistics,regression,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,statistics_regression_h2,statistics,regression,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Bespoke-Stratos-7B,statistics_regression_h3,statistics,regression,A,0.0,0.95,B,0.95,B,0.95,B,0.9,B
Bespoke-Stratos-7B,statistics_bayesian_e1,statistics,bayesian inference,A,1.0,0.95,B,0.75,A,0.98,A,0.95,B
Bespoke-Stratos-7B,statistics_bayesian_e2,statistics,bayesian inference,A,0.0,0.95,B,0.85,B,0.95,B,0.9,B
Bespoke-Stratos-7B,statistics_bayesian_e3,statistics,bayesian inference,A,1.0,0.95,A,0.8,A,0.95,A,0.95,B
Bespoke-Stratos-7B,statistics_bayesian_m1,statistics,bayesian inference,A,0.0,0.95,A,0.65,B,0.95,B,0.95,B
Bespoke-Stratos-7B,statistics_bayesian_m2,statistics,bayesian inference,B,0.0,0.95,A,0.85,A,0.95,B,0.95,A
Bespoke-Stratos-7B,statistics_bayesian_m3,statistics,bayesian inference,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Bespoke-Stratos-7B,statistics_bayesian_h1,statistics,bayesian inference,A,0.0,0.95,B,0.98,B,0.98,B,1.0,A
Bespoke-Stratos-7B,statistics_bayesian_h2,statistics,bayesian inference,A,1.0,0.95,A,1.0,A,0.95,A,0.95,A
Bespoke-Stratos-7B,statistics_bayesian_h3,statistics,bayesian inference,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Bespoke-Stratos-7B,linearalgebra_matrices_e1,linear algebra,matrices,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,linearalgebra_matrices_e2,linear algebra,matrices,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Bespoke-Stratos-7B,linearalgebra_matrices_e3,linear algebra,matrices,B,1.0,0.95,B,0.95,B,0.98,B,0.95,B
Bespoke-Stratos-7B,linearalgebra_matrices_m1,linear algebra,matrices,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,linearalgebra_matrices_m2,linear algebra,matrices,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
Bespoke-Stratos-7B,linearalgebra_matrices_m3,linear algebra,matrices,A,1.0,0.95,B,0.9,A,0.95,A,0.95,A
Bespoke-Stratos-7B,linearalgebra_matrices_h1,linear algebra,matrices,B,1.0,0.95,A,0.85,B,0.95,B,0.8,B
Bespoke-Stratos-7B,linearalgebra_matrices_h2,linear algebra,matrices,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Bespoke-Stratos-7B,linearalgebra_matrices_h3,linear algebra,matrices,B,1.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,linearalgebra_determinants_e1,linear algebra,determinants,A,1.0,0.95,B,0.7,A,0.95,A,0.95,A
Bespoke-Stratos-7B,linearalgebra_determinants_e2,linear algebra,determinants,A,0.0,0.95,B,0.85,B,0.95,B,0.9,B
Bespoke-Stratos-7B,linearalgebra_determinants_e3,linear algebra,determinants,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,linearalgebra_determinants_m1,linear algebra,determinants,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Bespoke-Stratos-7B,linearalgebra_determinants_m2,linear algebra,determinants,B,1.0,0.95,B,0.95,B,0.85,B,0.95,A
Bespoke-Stratos-7B,linearalgebra_determinants_m3,linear algebra,determinants,A,0.0,0.95,B,0.85,B,0.85,A,0.95,B
Bespoke-Stratos-7B,linearalgebra_determinants_h1,linear algebra,determinants,B,1.0,0.95,B,0.7,B,0.9,A,0.8,B
Bespoke-Stratos-7B,linearalgebra_determinants_h2,linear algebra,determinants,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,linearalgebra_determinants_h3,linear algebra,determinants,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Bespoke-Stratos-7B,linearalgebra_vectorspaces_e1,linear algebra,vector spaces,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,linearalgebra_vectorspaces_e2,linear algebra,vector spaces,A,1.0,0.95,A,0.9,A,0.95,B,1.0,B
Bespoke-Stratos-7B,linearalgebra_vectorspaces_e3,linear algebra,vector spaces,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,linearalgebra_vectorspaces_m1,linear algebra,vector spaces,A,0.0,0.95,B,0.75,B,0.95,B,0.95,B
Bespoke-Stratos-7B,linearalgebra_vectorspaces_m2,linear algebra,vector spaces,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
Bespoke-Stratos-7B,linearalgebra_vectorspaces_m3,linear algebra,vector spaces,A,1.0,0.95,A,1.0,A,0.95,A,1.0,B
Bespoke-Stratos-7B,linearalgebra_vectorspaces_h1,linear algebra,vector spaces,A,1.0,0.98,B,0.95,A,0.95,A,0.95,A
Bespoke-Stratos-7B,linearalgebra_vectorspaces_h2,linear algebra,vector spaces,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,linearalgebra_vectorspaces_h3,linear algebra,vector spaces,B,1.0,0.95,B,0.95,B,0.75,A,0.9,B
Bespoke-Stratos-7B,linearalgebra_eigenvalues_e1,linear algebra,eigenvalues,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,linearalgebra_eigenvalues_e2,linear algebra,eigenvalues,A,1.0,0.95,A,0.75,A,0.95,A,0.95,A
Bespoke-Stratos-7B,linearalgebra_eigenvalues_e3,linear algebra,eigenvalues,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,linearalgebra_eigenvalues_m1,linear algebra,eigenvalues,A,0.0,0.95,B,0.98,B,0.98,B,0.95,B
Bespoke-Stratos-7B,linearalgebra_eigenvalues_m2,linear algebra,eigenvalues,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,linearalgebra_eigenvalues_m3,linear algebra,eigenvalues,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
Bespoke-Stratos-7B,linearalgebra_eigenvalues_h1,linear algebra,eigenvalues,B,0.0,0.95,A,0.95,B,0.85,A,0.95,A
Bespoke-Stratos-7B,linearalgebra_eigenvalues_h2,linear algebra,eigenvalues,A,0.0,0.95,B,0.95,B,0.85,B,0.95,A
Bespoke-Stratos-7B,linearalgebra_eigenvalues_h3,linear algebra,eigenvalues,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Bespoke-Stratos-7B,linearalgebra_transformations_e1,linear algebra,linear transformations,B,1.0,0.95,A,0.9,B,0.95,B,1.0,A
Bespoke-Stratos-7B,linearalgebra_transformations_e2,linear algebra,linear transformations,A,1.0,0.95,A,0.8,A,0.95,A,0.95,A
Bespoke-Stratos-7B,linearalgebra_transformations_e3,linear algebra,linear transformations,A,0.0,0.98,B,0.95,B,0.98,B,0.95,A
Bespoke-Stratos-7B,linearalgebra_transformations_m1,linear algebra,linear transformations,A,0.0,0.95,A,0.85,B,0.95,B,0.95,B
Bespoke-Stratos-7B,linearalgebra_transformations_m2,linear algebra,linear transformations,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
Bespoke-Stratos-7B,linearalgebra_transformations_m3,linear algebra,linear transformations,A,1.0,0.95,A,0.85,A,0.95,A,1.0,A
Bespoke-Stratos-7B,linearalgebra_transformations_h1,linear algebra,linear transformations,B,1.0,0.85,B,0.95,B,0.95,B,0.95,B
Bespoke-Stratos-7B,linearalgebra_transformations_h2,linear algebra,linear transformations,A,0.0,0.95,B,0.85,B,0.95,B,0.9,B
Bespoke-Stratos-7B,linearalgebra_transformations_h3,linear algebra,linear transformations,A,1.0,0.95,A,0.85,A,0.95,B,0.9,A
JiuZhang3.0-7B,arithmetic_basic_operations_e1,arithmetic,basic operations,Tie,0.5,0.5,B,0.95,B,0.95,B,1.0,A
JiuZhang3.0-7B,arithmetic_basic_operations_e2,arithmetic,basic operations,B,0.0,1.0,A,0.95,A,0.95,B,0.8,B
JiuZhang3.0-7B,arithmetic_basic_operations_e3,arithmetic,basic operations,B,0.0,1.0,A,0.95,B,0.95,A,0.95,B
JiuZhang3.0-7B,arithmetic_basic_operations_m1,arithmetic,basic operations,A,0.0,0.95,B,1.0,B,1.0,B,1.0,A
JiuZhang3.0-7B,arithmetic_basic_operations_m2,arithmetic,basic operations,Tie,0.5,0.5,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,arithmetic_basic_operations_m3,arithmetic,basic operations,B,0.0,1.0,A,0.95,A,0.95,B,1.0,B
JiuZhang3.0-7B,arithmetic_basic_operations_h1,arithmetic,basic operations,A,1.0,1.0,A,0.95,A,0.95,A,1.0,A
JiuZhang3.0-7B,arithmetic_basic_operations_h2,arithmetic,basic operations,Tie,0.5,0.5,B,0.95,B,0.98,B,1.0,B
JiuZhang3.0-7B,arithmetic_basic_operations_h3,arithmetic,basic operations,Tie,0.5,0.5,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,arithmetic_fractions_e1,arithmetic,fractions,Tie,0.5,0.5,A,0.85,B,0.95,A,0.95,A
JiuZhang3.0-7B,arithmetic_fractions_e2,arithmetic,fractions,Tie,0.5,0.5,A,0.85,A,0.95,A,0.95,A
JiuZhang3.0-7B,arithmetic_fractions_e3,arithmetic,fractions,B,1.0,1.0,B,0.85,B,0.95,B,0.95,A
JiuZhang3.0-7B,arithmetic_fractions_m1,arithmetic,fractions,B,1.0,1.0,B,0.95,B,0.95,B,1.0,B
JiuZhang3.0-7B,arithmetic_fractions_m2,arithmetic,fractions,B,1.0,1.0,B,0.51,A,0.95,B,0.95,A
JiuZhang3.0-7B,arithmetic_fractions_m3,arithmetic,fractions,B,1.0,1.0,B,0.9,B,0.95,B,1.0,B
JiuZhang3.0-7B,arithmetic_fractions_h1,arithmetic,fractions,A,1.0,1.0,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,arithmetic_fractions_h2,arithmetic,fractions,Tie,0.5,0.5,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,arithmetic_fractions_h3,arithmetic,fractions,Tie,0.5,0.5,A,0.95,A,0.98,A,1.0,B
JiuZhang3.0-7B,arithmetic_percentages_e1,arithmetic,percentages,B,1.0,0.0,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,arithmetic_percentages_e2,arithmetic,percentages,Tie,0.5,0.5,B,1.0,B,1.0,B,1.0,A
JiuZhang3.0-7B,arithmetic_percentages_e3,arithmetic,percentages,Tie,0.5,0.5,B,0.98,B,0.98,B,1.0,A
JiuZhang3.0-7B,arithmetic_percentages_m1,arithmetic,percentages,Tie,0.5,0.5,A,0.95,A,0.95,A,0.95,A
JiuZhang3.0-7B,arithmetic_percentages_m2,arithmetic,percentages,Tie,0.5,0.5,A,0.95,A,0.95,A,0.95,A
JiuZhang3.0-7B,arithmetic_percentages_m3,arithmetic,percentages,Tie,0.5,0.5,B,0.85,B,0.95,B,1.0,B
JiuZhang3.0-7B,arithmetic_percentages_h1,arithmetic,percentages,Tie,0.5,0.5,B,0.65,B,0.95,A,1.0,A
JiuZhang3.0-7B,arithmetic_percentages_h2,arithmetic,percentages,Tie,0.5,0.5,A,0.95,A,0.95,A,1.0,B
JiuZhang3.0-7B,arithmetic_percentages_h3,arithmetic,percentages,Tie,0.5,0.5,B,0.7,B,0.95,B,0.95,A
JiuZhang3.0-7B,arithmetic_numerical_e1,arithmetic,numerical approximation,B,0.0,1.0,A,0.95,A,0.95,A,0.95,B
JiuZhang3.0-7B,arithmetic_numerical_e2,arithmetic,numerical approximation,B,1.0,0.9,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,arithmetic_numerical_e3,arithmetic,numerical approximation,A,1.0,1.0,A,0.9,A,0.9,A,0.8,B
JiuZhang3.0-7B,arithmetic_numerical_m1,arithmetic,numerical approximation,B,0.0,1.0,A,1.0,A,0.99,A,1.0,A
JiuZhang3.0-7B,arithmetic_numerical_m2,arithmetic,numerical approximation,B,0.0,1.0,A,1.0,A,0.85,A,0.6,A
JiuZhang3.0-7B,arithmetic_numerical_m3,arithmetic,numerical approximation,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
JiuZhang3.0-7B,arithmetic_numerical_h1,arithmetic,numerical approximation,A,1.0,0.95,A,1.0,A,0.99,A,1.0,B
JiuZhang3.0-7B,arithmetic_numerical_h2,arithmetic,numerical approximation,Tie,0.5,0.5,A,0.85,A,0.95,A,0.95,A
JiuZhang3.0-7B,arithmetic_numerical_h3,arithmetic,numerical approximation,Tie,0.5,0.5,A,0.95,A,0.95,A,1.0,A
JiuZhang3.0-7B,arithmetic_order_e1,arithmetic,order of operations,Tie,0.5,0.5,B,0.75,A,0.95,A,0.95,B
JiuZhang3.0-7B,arithmetic_order_e2,arithmetic,order of operations,A,1.0,1.0,A,0.85,A,0.95,A,0.95,A
JiuZhang3.0-7B,arithmetic_order_e3,arithmetic,order of operations,Tie,0.5,0.5,B,1.0,B,1.0,B,1.0,A
JiuZhang3.0-7B,arithmetic_order_m1,arithmetic,order of operations,B,1.0,1.0,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,arithmetic_order_m2,arithmetic,order of operations,B,0.0,1.0,B,0.75,A,1.0,A,0.95,A
JiuZhang3.0-7B,arithmetic_order_m3,arithmetic,order of operations,Tie,0.5,0.5,B,0.85,B,0.95,B,0.95,B
JiuZhang3.0-7B,arithmetic_order_h1,arithmetic,order of operations,Tie,0.5,0.5,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,arithmetic_order_h2,arithmetic,order of operations,A,0.0,1.0,B,0.95,B,0.95,B,0.95,A
JiuZhang3.0-7B,arithmetic_order_h3,arithmetic,order of operations,A,0.0,1.0,B,0.95,B,0.95,B,0.95,B
JiuZhang3.0-7B,algebra_equations_e1,algebra,equations,B,0.0,1.0,B,0.85,A,0.95,A,0.95,A
JiuZhang3.0-7B,algebra_equations_e2,algebra,equations,B,1.0,1.0,B,0.95,B,0.98,B,1.0,B
JiuZhang3.0-7B,algebra_equations_e3,algebra,equations,Tie,0.5,0.5,A,0.9,A,0.95,A,1.0,A
JiuZhang3.0-7B,algebra_equations_m1,algebra,equations,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
JiuZhang3.0-7B,algebra_equations_m2,algebra,equations,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
JiuZhang3.0-7B,algebra_equations_m3,algebra,equations,A,1.0,1.0,A,0.85,A,0.95,A,0.95,B
JiuZhang3.0-7B,algebra_equations_h1,algebra,equations,A,1.0,1.0,B,0.85,A,0.95,A,0.95,A
JiuZhang3.0-7B,algebra_equations_h2,algebra,equations,B,1.0,0.9,A,0.85,B,0.9,,,A
JiuZhang3.0-7B,algebra_equations_h3,algebra,equations,Tie,0.5,0.5,B,0.85,B,0.85,B,0.6,A
JiuZhang3.0-7B,algebra_inequalities_e1,algebra,inequalities,B,0.0,1.0,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,algebra_inequalities_e2,algebra,inequalities,B,0.0,1.0,A,1.0,A,1.0,A,0.95,A
JiuZhang3.0-7B,algebra_inequalities_e3,algebra,inequalities,B,0.0,1.0,A,0.95,A,0.95,A,0.95,A
JiuZhang3.0-7B,algebra_inequalities_m1,algebra,inequalities,Tie,0.5,0.5,B,0.85,A,0.95,A,0.95,A
JiuZhang3.0-7B,algebra_inequalities_m2,algebra,inequalities,Tie,0.5,0.5,B,0.85,B,1.0,B,0.95,A
JiuZhang3.0-7B,algebra_inequalities_m3,algebra,inequalities,Tie,0.5,0.5,B,0.95,B,0.95,B,0.9,B
JiuZhang3.0-7B,algebra_inequalities_h1,algebra,inequalities,A,1.0,1.0,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,algebra_inequalities_h2,algebra,inequalities,Tie,0.5,0.5,A,0.75,A,0.85,,,A
JiuZhang3.0-7B,algebra_inequalities_h3,algebra,inequalities,A,0.0,1.0,B,0.95,B,0.98,B,1.0,A
JiuZhang3.0-7B,algebra_polynomials_e1,algebra,polynomials,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
JiuZhang3.0-7B,algebra_polynomials_e2,algebra,polynomials,Tie,0.5,0.5,B,0.95,A,0.95,B,1.0,A
JiuZhang3.0-7B,algebra_polynomials_e3,algebra,polynomials,B,1.0,1.0,B,0.85,B,0.95,B,0.95,B
JiuZhang3.0-7B,algebra_polynomials_m1,algebra,polynomials,Tie,0.5,0.5,A,0.85,A,0.95,A,0.95,A
JiuZhang3.0-7B,algebra_polynomials_m2,algebra,polynomials,Tie,0.5,0.5,A,0.95,A,0.95,A,0.95,A
JiuZhang3.0-7B,algebra_polynomials_m3,algebra,polynomials,Tie,0.5,0.5,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,algebra_polynomials_h1,algebra,polynomials,A,1.0,1.0,A,1.0,A,1.0,A,1.0,B
JiuZhang3.0-7B,algebra_polynomials_h2,algebra,polynomials,Tie,0.5,0.5,A,0.7,B,0.85,,,A
JiuZhang3.0-7B,algebra_polynomials_h3,algebra,polynomials,Tie,0.5,0.5,B,0.95,A,0.5,B,0.75,B
JiuZhang3.0-7B,algebra_functions_e1,algebra,functions,A,1.0,1.0,A,0.95,A,0.95,A,1.0,A
JiuZhang3.0-7B,algebra_functions_e2,algebra,functions,B,0.0,1.0,A,1.0,A,0.95,A,1.0,B
JiuZhang3.0-7B,algebra_functions_e3,algebra,functions,B,0.0,1.0,A,0.51,A,0.95,B,0.9,A
JiuZhang3.0-7B,algebra_functions_m1,algebra,functions,A,1.0,1.0,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,algebra_functions_m2,algebra,functions,Tie,0.5,0.5,A,0.9,A,0.95,A,1.0,B
JiuZhang3.0-7B,algebra_functions_m3,algebra,functions,B,1.0,1.0,B,0.85,B,0.95,B,0.9,A
JiuZhang3.0-7B,algebra_functions_h1,algebra,functions,Tie,0.5,0.5,B,0.95,B,0.95,B,0.95,B
JiuZhang3.0-7B,algebra_functions_h2,algebra,functions,Tie,0.5,0.5,A,0.85,B,0.95,B,0.95,B
JiuZhang3.0-7B,algebra_functions_h3,algebra,functions,B,0.0,1.0,A,0.85,B,0.6,A,0.8,A
JiuZhang3.0-7B,algebra_systems_e1,algebra,systems of equations,B,1.0,1.0,B,0.95,B,0.95,B,1.0,B
JiuZhang3.0-7B,algebra_systems_e2,algebra,systems of equations,A,0.0,1.0,B,0.55,A,0.95,B,0.95,B
JiuZhang3.0-7B,algebra_systems_e3,algebra,systems of equations,B,0.0,1.0,A,0.9,A,0.95,A,0.95,A
JiuZhang3.0-7B,algebra_systems_m1,algebra,systems of equations,B,1.0,1.0,B,0.95,B,0.95,B,0.95,A
JiuZhang3.0-7B,algebra_systems_m2,algebra,systems of equations,A,0.0,1.0,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,algebra_systems_m3,algebra,systems of equations,Tie,0.5,0.5,A,0.95,A,0.85,A,0.4,A
JiuZhang3.0-7B,algebra_systems_h1,algebra,systems of equations,B,1.0,1.0,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,algebra_systems_h2,algebra,systems of equations,B,1.0,1.0,B,0.85,B,0.9,A,0.8,B
JiuZhang3.0-7B,algebra_systems_h3,algebra,systems of equations,A,0.0,1.0,B,1.0,B,0.95,B,1.0,B
JiuZhang3.0-7B,calculus_differentiation_e1,calculus,differentiation,Tie,0.5,0.5,A,0.9,A,0.98,A,1.0,A
JiuZhang3.0-7B,calculus_differentiation_e2,calculus,differentiation,B,1.0,1.0,B,0.95,B,0.98,B,1.0,B
JiuZhang3.0-7B,calculus_differentiation_e3,calculus,differentiation,B,0.0,1.0,A,1.0,A,0.95,A,1.0,B
JiuZhang3.0-7B,calculus_differentiation_m1,calculus,differentiation,A,0.0,1.0,B,0.95,B,0.95,B,1.0,B
JiuZhang3.0-7B,calculus_differentiation_m2,calculus,differentiation,A,1.0,1.0,A,0.95,A,0.95,A,0.95,B
JiuZhang3.0-7B,calculus_differentiation_m3,calculus,differentiation,Tie,0.5,0.5,B,0.75,A,0.9,A,1.0,B
JiuZhang3.0-7B,calculus_differentiation_h1,calculus,differentiation,B,1.0,0.9,B,0.95,B,0.95,B,1.0,A
JiuZhang3.0-7B,calculus_differentiation_h2,calculus,differentiation,Tie,0.5,0.5,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,calculus_differentiation_h3,calculus,differentiation,B,0.0,0.5,A,0.95,A,0.85,,,A
JiuZhang3.0-7B,calculus_integration_e1,calculus,integration,Tie,0.5,0.5,A,1.0,A,1.0,A,1.0,B
JiuZhang3.0-7B,calculus_integration_e2,calculus,integration,B,1.0,1.0,A,0.85,B,0.95,B,1.0,B
JiuZhang3.0-7B,calculus_integration_e3,calculus,integration,Tie,0.5,0.5,A,1.0,A,0.95,A,1.0,A
JiuZhang3.0-7B,calculus_integration_m1,calculus,integration,Tie,0.5,0.5,B,0.85,B,0.95,B,0.95,A
JiuZhang3.0-7B,calculus_integration_m2,calculus,integration,A,1.0,1.0,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,calculus_integration_m3,calculus,integration,B,1.0,1.0,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,calculus_integration_h1,calculus,integration,A,1.0,0.9,A,0.65,B,0.6,,,B
JiuZhang3.0-7B,calculus_integration_h2,calculus,integration,A,1.0,0.5,B,0.0,A,0.6,A,0.7,A
JiuZhang3.0-7B,calculus_integration_h3,calculus,integration,B,0.0,0.7,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,calculus_limits_e1,calculus,limits,B,1.0,1.0,A,0.65,B,0.95,B,0.9,A
JiuZhang3.0-7B,calculus_limits_e2,calculus,limits,Tie,0.5,0.5,A,0.9,A,0.95,A,1.0,B
JiuZhang3.0-7B,calculus_limits_e3,calculus,limits,Tie,0.5,0.5,B,0.95,B,0.95,B,1.0,B
JiuZhang3.0-7B,calculus_limits_m1,calculus,limits,Tie,0.5,0.5,B,0.95,A,0.95,A,0.95,B
JiuZhang3.0-7B,calculus_limits_m2,calculus,limits,B,1.0,1.0,B,0.85,B,0.95,B,0.95,B
JiuZhang3.0-7B,calculus_limits_m3,calculus,limits,Tie,0.5,0.5,B,0.65,A,0.5,B,0.4,B
JiuZhang3.0-7B,calculus_limits_h1,calculus,limits,Tie,0.5,0.5,A,0.8,B,0.7,B,0.4,B
JiuZhang3.0-7B,calculus_limits_h2,calculus,limits,B,1.0,1.0,B,1.0,B,1.0,B,1.0,A
JiuZhang3.0-7B,calculus_limits_h3,calculus,limits,A,0.0,1.0,B,1.0,B,1.0,B,0.95,B
JiuZhang3.0-7B,calculus_series_e1,calculus,series,A,0.0,1.0,B,0.95,A,0.95,B,1.0,A
JiuZhang3.0-7B,calculus_series_e2,calculus,series,Tie,0.5,0.5,A,0.9,A,0.95,A,1.0,A
JiuZhang3.0-7B,calculus_series_e3,calculus,series,Tie,0.5,0.5,B,0.85,B,0.95,B,0.95,A
JiuZhang3.0-7B,calculus_series_m1,calculus,series,A,0.0,1.0,B,0.85,A,0.95,B,1.0,B
JiuZhang3.0-7B,calculus_series_m2,calculus,series,A,0.0,1.0,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,calculus_series_m3,calculus,series,Tie,0.5,0.5,B,0.95,B,0.95,B,0.9,B
JiuZhang3.0-7B,calculus_series_h1,calculus,series,Tie,0.5,0.5,B,1.0,B,0.98,B,1.0,A
JiuZhang3.0-7B,calculus_series_h2,calculus,series,Tie,0.5,0.5,B,0.85,B,0.95,B,0.9,B
JiuZhang3.0-7B,calculus_series_h3,calculus,series,B,1.0,0.9,B,0.85,B,0.7,B,0.6,B
JiuZhang3.0-7B,calculus_applications_e1,calculus,applications,A,1.0,1.0,A,0.85,A,0.95,A,0.95,A
JiuZhang3.0-7B,calculus_applications_e2,calculus,applications,A,1.0,1.0,A,0.95,B,0.95,A,0.9,B
JiuZhang3.0-7B,calculus_applications_e3,calculus,applications,A,0.0,1.0,B,0.95,B,0.95,B,0.95,B
JiuZhang3.0-7B,calculus_applications_m1,calculus,applications,Tie,0.5,0.5,B,0.95,B,0.98,B,1.0,B
JiuZhang3.0-7B,calculus_applications_m2,calculus,applications,B,1.0,1.0,B,1.0,B,0.95,B,0.75,B
JiuZhang3.0-7B,calculus_applications_m3,calculus,applications,Tie,0.5,0.5,A,0.75,A,0.5,B,0.95,B
JiuZhang3.0-7B,calculus_applications_h1,calculus,applications,B,1.0,1.0,B,0.85,B,0.85,A,0.7,A
JiuZhang3.0-7B,calculus_applications_h2,calculus,applications,Tie,0.5,0.5,A,0.85,A,0.95,A,0.95,A
JiuZhang3.0-7B,calculus_applications_h3,calculus,applications,A,1.0,0.5,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,geometry_plane_e1,geometry,plane geometry,Tie,0.5,0.5,B,0.95,B,0.95,B,0.9,B
JiuZhang3.0-7B,geometry_plane_e2,geometry,plane geometry,Tie,0.5,0.5,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,geometry_plane_e3,geometry,plane geometry,Tie,0.5,0.5,B,0.75,A,0.9,B,0.95,A
JiuZhang3.0-7B,geometry_plane_m1,geometry,plane geometry,Tie,0.5,0.5,B,0.65,A,0.9,A,0.8,B
JiuZhang3.0-7B,geometry_plane_m2,geometry,plane geometry,Tie,0.5,0.5,A,0.9,A,0.95,A,0.95,B
JiuZhang3.0-7B,geometry_plane_m3,geometry,plane geometry,B,1.0,1.0,B,0.95,B,0.95,B,0.95,B
JiuZhang3.0-7B,geometry_plane_h1,geometry,plane geometry,B,0.0,1.0,A,0.95,A,0.95,A,1.0,A
JiuZhang3.0-7B,geometry_plane_h2,geometry,plane geometry,B,1.0,1.0,B,0.85,B,0.85,B,0.6,B
JiuZhang3.0-7B,geometry_plane_h3,geometry,plane geometry,B,0.0,0.9,B,0.51,A,0.95,A,0.95,A
JiuZhang3.0-7B,geometry_coordinate_e1,geometry,coordinate geometry,Tie,0.5,0.5,B,0.85,A,0.95,A,0.95,B
JiuZhang3.0-7B,geometry_coordinate_e2,geometry,coordinate geometry,Tie,0.5,0.5,A,0.95,A,0.95,A,1.0,A
JiuZhang3.0-7B,geometry_coordinate_e3,geometry,coordinate geometry,B,0.0,1.0,A,0.8,A,0.95,A,0.9,B
JiuZhang3.0-7B,geometry_coordinate_m1,geometry,coordinate geometry,B,1.0,0.9,B,0.95,B,0.95,B,0.9,B
JiuZhang3.0-7B,geometry_coordinate_m2,geometry,coordinate geometry,B,1.0,1.0,B,0.95,B,0.95,B,0.95,B
JiuZhang3.0-7B,geometry_coordinate_m3,geometry,coordinate geometry,B,1.0,1.0,B,1.0,B,1.0,B,1.0,A
JiuZhang3.0-7B,geometry_coordinate_h1,geometry,coordinate geometry,Tie,0.5,0.5,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,geometry_coordinate_h2,geometry,coordinate geometry,B,0.0,1.0,A,0.85,A,0.95,A,0.95,A
JiuZhang3.0-7B,geometry_coordinate_h3,geometry,coordinate geometry,Tie,0.5,0.5,B,0.7,A,0.95,A,0.95,A
JiuZhang3.0-7B,geometry_transformations_e1,geometry,transformations,B,0.0,0.5,A,1.0,A,1.0,A,1.0,B
JiuZhang3.0-7B,geometry_transformations_e2,geometry,transformations,B,0.0,1.0,A,0.98,A,0.95,A,0.95,A
JiuZhang3.0-7B,geometry_transformations_e3,geometry,transformations,A,1.0,1.0,A,0.85,B,0.95,A,0.95,B
JiuZhang3.0-7B,geometry_transformations_m1,geometry,transformations,B,1.0,1.0,B,0.9,B,0.95,B,0.95,B
JiuZhang3.0-7B,geometry_transformations_m2,geometry,transformations,Tie,0.5,0.5,A,0.75,A,0.9,B,0.4,B
JiuZhang3.0-7B,geometry_transformations_m3,geometry,transformations,Tie,0.5,0.5,B,0.51,A,1.0,B,0.95,A
JiuZhang3.0-7B,geometry_transformations_h1,geometry,transformations,A,1.0,1.0,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,geometry_transformations_h2,geometry,transformations,A,1.0,0.5,A,0.6,A,0.85,A,0.7,A
JiuZhang3.0-7B,geometry_transformations_h3,geometry,transformations,B,1.0,0.9,B,0.6,B,0.5,A,0.6,A
JiuZhang3.0-7B,geometry_mensuration_e1,geometry,mensuration,Tie,0.5,0.5,B,0.85,A,0.95,A,0.95,A
JiuZhang3.0-7B,geometry_mensuration_e2,geometry,mensuration,Tie,0.5,0.5,A,0.85,A,0.95,A,0.95,A
JiuZhang3.0-7B,geometry_mensuration_e3,geometry,mensuration,B,0.0,0.8,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,geometry_mensuration_m1,geometry,mensuration,Tie,0.5,0.5,A,0.75,A,0.95,A,1.0,A
JiuZhang3.0-7B,geometry_mensuration_m2,geometry,mensuration,B,1.0,1.0,B,0.95,B,0.95,B,0.95,B
JiuZhang3.0-7B,geometry_mensuration_m3,geometry,mensuration,B,0.0,1.0,A,0.75,A,0.95,A,0.95,B
JiuZhang3.0-7B,geometry_mensuration_h1,geometry,mensuration,Tie,0.5,0.5,B,0.85,B,0.85,B,0.7,B
JiuZhang3.0-7B,geometry_mensuration_h2,geometry,mensuration,A,0.0,1.0,B,0.65,B,0.9,A,0.7,A
JiuZhang3.0-7B,geometry_mensuration_h3,geometry,mensuration,Tie,0.5,0.5,B,0.7,A,0.6,B,0.8,A
JiuZhang3.0-7B,geometry_trigonometry_e1,geometry,trigonometry,Tie,0.5,0.5,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,geometry_trigonometry_e2,geometry,trigonometry,Tie,0.5,0.5,B,0.95,B,0.95,B,1.0,B
JiuZhang3.0-7B,geometry_trigonometry_e3,geometry,trigonometry,B,1.0,1.0,B,0.55,B,0.95,B,0.95,B
JiuZhang3.0-7B,geometry_trigonometry_m1,geometry,trigonometry,B,1.0,0.9,B,0.65,A,0.75,B,0.6,B
JiuZhang3.0-7B,geometry_trigonometry_m2,geometry,trigonometry,B,1.0,1.0,B,0.95,B,0.95,B,1.0,B
JiuZhang3.0-7B,geometry_trigonometry_m3,geometry,trigonometry,Tie,0.5,0.5,B,0.85,B,0.95,B,0.95,B
JiuZhang3.0-7B,geometry_trigonometry_h1,geometry,trigonometry,Tie,0.5,0.5,A,0.65,B,0.95,A,0.8,B
JiuZhang3.0-7B,geometry_trigonometry_h2,geometry,trigonometry,A,1.0,1.0,A,0.65,A,0.7,,,A
JiuZhang3.0-7B,geometry_trigonometry_h3,geometry,trigonometry,Tie,0.5,0.5,B,0.75,B,0.7,B,0.7,A
JiuZhang3.0-7B,numbertheory_divisibility_e1,number theory,divisibility,Tie,0.5,0.5,A,1.0,A,0.95,A,1.0,A
JiuZhang3.0-7B,numbertheory_divisibility_e2,number theory,divisibility,Tie,0.5,0.5,B,0.95,B,0.95,B,0.95,B
JiuZhang3.0-7B,numbertheory_divisibility_e3,number theory,divisibility,Tie,0.5,0.5,A,0.95,A,0.95,A,0.95,A
JiuZhang3.0-7B,numbertheory_divisibility_m1,number theory,divisibility,B,1.0,1.0,B,0.85,A,0.95,B,0.95,A
JiuZhang3.0-7B,numbertheory_divisibility_m2,number theory,divisibility,B,1.0,1.0,B,0.95,A,0.95,B,0.95,A
JiuZhang3.0-7B,numbertheory_divisibility_m3,number theory,divisibility,Tie,0.5,0.5,B,0.95,B,0.95,B,1.0,B
JiuZhang3.0-7B,numbertheory_divisibility_h1,number theory,divisibility,Tie,0.5,0.5,B,1.0,B,1.0,B,1.0,A
JiuZhang3.0-7B,numbertheory_divisibility_h2,number theory,divisibility,Tie,0.5,0.5,B,0.95,B,0.95,B,0.95,B
JiuZhang3.0-7B,numbertheory_divisibility_h3,number theory,divisibility,Tie,0.5,0.5,B,0.85,A,0.95,A,1.0,B
JiuZhang3.0-7B,numbertheory_modular_e1,number theory,modular arithmetic,Tie,0.5,0.5,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,numbertheory_modular_e2,number theory,modular arithmetic,B,1.0,1.0,B,0.95,B,0.95,B,1.0,A
JiuZhang3.0-7B,numbertheory_modular_e3,number theory,modular arithmetic,A,1.0,1.0,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,numbertheory_modular_m1,number theory,modular arithmetic,A,0.0,1.0,B,1.0,B,0.98,B,0.95,B
JiuZhang3.0-7B,numbertheory_modular_m2,number theory,modular arithmetic,Tie,0.5,0.5,B,0.8,B,0.75,A,0.7,B
JiuZhang3.0-7B,numbertheory_modular_m3,number theory,modular arithmetic,B,0.0,1.0,A,0.95,A,0.95,A,1.0,B
JiuZhang3.0-7B,numbertheory_modular_h1,number theory,modular arithmetic,A,0.0,1.0,B,0.85,B,0.5,B,0.6,A
JiuZhang3.0-7B,numbertheory_modular_h2,number theory,modular arithmetic,A,0.0,1.0,B,0.8,B,0.85,B,0.7,A
JiuZhang3.0-7B,numbertheory_modular_h3,number theory,modular arithmetic,Tie,0.5,0.5,B,0.9,B,0.7,B,0.7,B
JiuZhang3.0-7B,numbertheory_primes_e1,number theory,primes,Tie,0.5,0.5,A,0.95,A,0.95,A,1.0,A
JiuZhang3.0-7B,numbertheory_primes_e2,number theory,primes,A,1.0,1.0,B,0.75,A,0.95,A,0.9,B
JiuZhang3.0-7B,numbertheory_primes_e3,number theory,primes,Tie,0.5,0.5,A,0.7,A,1.0,A,1.0,A
JiuZhang3.0-7B,numbertheory_primes_m1,number theory,primes,Tie,0.5,0.5,B,1.0,B,0.95,B,0.95,B
JiuZhang3.0-7B,numbertheory_primes_m2,number theory,primes,Tie,0.5,0.5,A,0.95,B,0.95,B,0.9,B
JiuZhang3.0-7B,numbertheory_primes_m3,number theory,primes,A,0.0,0.9,B,0.95,B,0.95,B,0.95,A
JiuZhang3.0-7B,numbertheory_primes_h1,number theory,primes,A,0.0,1.0,B,0.9,B,0.95,B,0.95,B
JiuZhang3.0-7B,numbertheory_primes_h2,number theory,primes,A,1.0,1.0,A,0.6,A,0.8,A,0.8,A
JiuZhang3.0-7B,numbertheory_primes_h3,number theory,primes,A,1.0,0.9,A,0.95,A,0.95,A,1.0,A
JiuZhang3.0-7B,numbertheory_diophantine_e1,number theory,diophantine equations,B,0.0,0.5,A,1.0,A,0.95,A,0.8,B
JiuZhang3.0-7B,numbertheory_diophantine_e2,number theory,diophantine equations,Tie,0.5,0.5,B,0.95,B,0.9,B,0.7,A
JiuZhang3.0-7B,numbertheory_diophantine_e3,number theory,diophantine equations,A,1.0,1.0,A,0.8,A,0.95,A,0.95,A
JiuZhang3.0-7B,numbertheory_diophantine_m1,number theory,diophantine equations,Tie,0.5,0.5,B,0.95,B,0.98,B,1.0,B
JiuZhang3.0-7B,numbertheory_diophantine_m2,number theory,diophantine equations,Tie,0.5,0.5,A,0.85,A,0.85,A,0.7,B
JiuZhang3.0-7B,numbertheory_diophantine_m3,number theory,diophantine equations,Tie,0.5,0.5,A,0.75,A,0.9,A,0.9,B
JiuZhang3.0-7B,numbertheory_diophantine_h1,number theory,diophantine equations,A,0.0,0.9,B,0.65,B,0.7,B,0.7,B
JiuZhang3.0-7B,numbertheory_diophantine_h2,number theory,diophantine equations,A,1.0,0.5,A,0.85,A,0.7,A,0.7,B
JiuZhang3.0-7B,numbertheory_diophantine_h3,number theory,diophantine equations,B,1.0,1.0,B,0.85,B,0.95,B,0.7,B
JiuZhang3.0-7B,numbertheory_sequences_e1,number theory,number sequences,A,1.0,1.0,A,0.95,A,0.95,A,1.0,A
JiuZhang3.0-7B,numbertheory_sequences_e2,number theory,number sequences,B,1.0,1.0,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,numbertheory_sequences_e3,number theory,number sequences,B,0.0,1.0,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,numbertheory_sequences_m1,number theory,number sequences,B,0.0,1.0,B,0.8,A,0.95,A,1.0,A
JiuZhang3.0-7B,numbertheory_sequences_m2,number theory,number sequences,A,1.0,1.0,A,0.95,A,0.6,A,0.4,A
JiuZhang3.0-7B,numbertheory_sequences_m3,number theory,number sequences,Tie,0.5,0.5,B,0.6,A,0.99,B,0.95,A
JiuZhang3.0-7B,numbertheory_sequences_h1,number theory,number sequences,Tie,0.5,0.5,A,0.85,A,0.9,A,0.8,A
JiuZhang3.0-7B,numbertheory_sequences_h2,number theory,number sequences,Tie,0.5,0.5,A,0.6,B,0.6,A,0.7,B
JiuZhang3.0-7B,numbertheory_sequences_h3,number theory,number sequences,Tie,0.5,0.5,B,1.0,B,0.95,B,1.0,A
JiuZhang3.0-7B,combinatorics_counting_e1,combinatorics,counting principles,Tie,0.5,0.5,B,1.0,A,0.5,B,1.0,B
JiuZhang3.0-7B,combinatorics_counting_e2,combinatorics,counting principles,Tie,0.5,0.5,A,0.85,A,0.95,B,0.95,A
JiuZhang3.0-7B,combinatorics_counting_e3,combinatorics,counting principles,Tie,0.5,0.5,B,0.6,B,0.95,B,0.95,B
JiuZhang3.0-7B,combinatorics_counting_m1,combinatorics,counting principles,Tie,0.5,0.5,A,0.65,A,0.95,A,0.95,A
JiuZhang3.0-7B,combinatorics_counting_m2,combinatorics,counting principles,A,0.0,1.0,B,0.65,A,0.95,B,0.9,B
JiuZhang3.0-7B,combinatorics_counting_m3,combinatorics,counting principles,A,1.0,0.5,B,0.75,A,0.9,,,A
JiuZhang3.0-7B,combinatorics_counting_h1,combinatorics,counting principles,B,0.0,1.0,A,0.9,A,0.95,A,0.9,A
JiuZhang3.0-7B,combinatorics_counting_h2,combinatorics,counting principles,A,0.0,0.5,B,0.95,B,0.95,B,1.0,B
JiuZhang3.0-7B,combinatorics_counting_h3,combinatorics,counting principles,Tie,0.5,0.5,A,1.0,A,0.95,A,1.0,A
JiuZhang3.0-7B,combinatorics_permutations_e1,combinatorics,permutations,A,1.0,1.0,B,0.65,A,0.95,A,0.9,A
JiuZhang3.0-7B,combinatorics_permutations_e2,combinatorics,permutations,B,0.0,1.0,B,0.51,A,0.95,A,0.95,A
JiuZhang3.0-7B,combinatorics_permutations_e3,combinatorics,permutations,B,1.0,1.0,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,combinatorics_permutations_m1,combinatorics,permutations,A,1.0,1.0,A,0.6,A,0.95,A,0.95,A
JiuZhang3.0-7B,combinatorics_permutations_m2,combinatorics,permutations,Tie,0.5,0.5,B,0.7,B,1.0,B,0.95,A
JiuZhang3.0-7B,combinatorics_permutations_m3,combinatorics,permutations,Tie,0.5,0.5,B,0.65,A,0.95,A,0.9,B
JiuZhang3.0-7B,combinatorics_permutations_h1,combinatorics,permutations,A,0.0,0.9,B,0.9,B,1.0,B,0.7,B
JiuZhang3.0-7B,combinatorics_permutations_h2,combinatorics,permutations,Tie,0.5,0.5,A,0.7,A,0.9,A,0.7,B
JiuZhang3.0-7B,combinatorics_permutations_h3,combinatorics,permutations,Tie,0.5,0.5,A,0.7,B,0.5,A,0.7,A
JiuZhang3.0-7B,combinatorics_combinations_e1,combinatorics,combinations,A,1.0,1.0,A,1.0,A,0.95,A,0.95,A
JiuZhang3.0-7B,combinatorics_combinations_e2,combinatorics,combinations,Tie,0.5,0.5,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,combinatorics_combinations_e3,combinatorics,combinations,Tie,0.5,0.5,A,0.55,A,0.95,A,0.95,A
JiuZhang3.0-7B,combinatorics_combinations_m1,combinatorics,combinations,A,0.0,1.0,B,0.55,A,0.95,B,1.0,B
JiuZhang3.0-7B,combinatorics_combinations_m2,combinatorics,combinations,Tie,0.5,0.5,B,0.85,A,0.95,A,1.0,B
JiuZhang3.0-7B,combinatorics_combinations_m3,combinatorics,combinations,Tie,0.5,0.5,B,0.95,B,0.95,B,1.0,A
JiuZhang3.0-7B,combinatorics_combinations_h1,combinatorics,combinations,Tie,0.5,0.5,B,0.9,B,0.95,B,0.9,A
JiuZhang3.0-7B,combinatorics_combinations_h2,combinatorics,combinations,A,1.0,1.0,A,0.85,A,0.9,A,0.8,B
JiuZhang3.0-7B,combinatorics_combinations_h3,combinatorics,combinations,Tie,0.5,0.5,B,0.95,B,0.9,A,0.8,B
JiuZhang3.0-7B,combinatorics_probability_e1,combinatorics,probability,Tie,0.5,0.5,A,0.85,A,0.95,A,1.0,A
JiuZhang3.0-7B,combinatorics_probability_e2,combinatorics,probability,A,0.0,1.0,A,0.55,B,0.95,B,0.95,B
JiuZhang3.0-7B,combinatorics_probability_e3,combinatorics,probability,A,1.0,1.0,A,1.0,A,1.0,A,1.0,B
JiuZhang3.0-7B,combinatorics_probability_m1,combinatorics,probability,B,1.0,1.0,B,1.0,B,1.0,B,1.0,A
JiuZhang3.0-7B,combinatorics_probability_m2,combinatorics,probability,Tie,0.5,0.5,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,combinatorics_probability_m3,combinatorics,probability,A,0.0,1.0,B,0.85,B,0.95,B,1.0,A
JiuZhang3.0-7B,combinatorics_probability_h1,combinatorics,probability,B,1.0,1.0,B,0.95,B,0.98,B,1.0,B
JiuZhang3.0-7B,combinatorics_probability_h2,combinatorics,probability,A,1.0,1.0,A,0.85,A,0.95,A,0.95,A
JiuZhang3.0-7B,combinatorics_probability_h3,combinatorics,probability,B,0.0,1.0,B,0.6,A,0.5,A,0.8,B
JiuZhang3.0-7B,combinatorics_recursion_e1,combinatorics,recursion,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
JiuZhang3.0-7B,combinatorics_recursion_e2,combinatorics,recursion,Tie,0.5,0.5,A,1.0,A,0.95,A,1.0,A
JiuZhang3.0-7B,combinatorics_recursion_e3,combinatorics,recursion,Tie,0.5,0.5,A,1.0,A,0.95,A,1.0,A
JiuZhang3.0-7B,combinatorics_recursion_m1,combinatorics,recursion,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
JiuZhang3.0-7B,combinatorics_recursion_m2,combinatorics,recursion,Tie,0.5,0.5,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,combinatorics_recursion_m3,combinatorics,recursion,Tie,0.5,0.5,B,0.85,B,0.7,,,A
JiuZhang3.0-7B,combinatorics_recursion_h1,combinatorics,recursion,Tie,0.5,0.5,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,combinatorics_recursion_h2,combinatorics,recursion,Tie,0.5,0.5,B,1.0,B,0.95,B,0.9,A
JiuZhang3.0-7B,combinatorics_recursion_h3,combinatorics,recursion,Tie,0.5,0.5,A,0.6,A,0.6,,,B
JiuZhang3.0-7B,statistics_descriptive_e1,statistics,descriptive statistics,Tie,0.5,0.5,B,0.85,A,0.95,A,1.0,B
JiuZhang3.0-7B,statistics_descriptive_e2,statistics,descriptive statistics,A,1.0,1.0,A,0.85,A,0.95,B,0.7,A
JiuZhang3.0-7B,statistics_descriptive_e3,statistics,descriptive statistics,B,1.0,1.0,B,0.95,B,0.95,B,0.95,B
JiuZhang3.0-7B,statistics_descriptive_m1,statistics,descriptive statistics,Tie,0.5,0.5,B,0.75,B,0.95,A,0.9,A
JiuZhang3.0-7B,statistics_descriptive_m2,statistics,descriptive statistics,B,0.0,1.0,A,0.55,B,0.9,A,0.9,A
JiuZhang3.0-7B,statistics_descriptive_m3,statistics,descriptive statistics,A,1.0,1.0,A,1.0,A,0.85,A,0.9,A
JiuZhang3.0-7B,statistics_descriptive_h1,statistics,descriptive statistics,A,1.0,1.0,A,0.95,A,0.99,A,0.95,A
JiuZhang3.0-7B,statistics_descriptive_h2,statistics,descriptive statistics,Tie,0.5,0.5,B,0.85,B,0.9,B,0.7,A
JiuZhang3.0-7B,statistics_descriptive_h3,statistics,descriptive statistics,Tie,0.5,0.5,A,0.7,A,0.7,A,0.6,B
JiuZhang3.0-7B,statistics_distributions_e1,statistics,distributions,Tie,0.5,0.5,A,1.0,A,1.0,A,1.0,B
JiuZhang3.0-7B,statistics_distributions_e2,statistics,distributions,Tie,0.5,0.5,A,0.9,A,0.95,A,1.0,B
JiuZhang3.0-7B,statistics_distributions_e3,statistics,distributions,Tie,0.5,0.5,B,0.9,A,0.95,B,0.95,A
JiuZhang3.0-7B,statistics_distributions_m1,statistics,distributions,Tie,0.5,0.5,A,0.95,A,0.98,A,1.0,A
JiuZhang3.0-7B,statistics_distributions_m2,statistics,distributions,Tie,0.5,0.5,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,statistics_distributions_m3,statistics,distributions,A,1.0,1.0,A,1.0,A,1.0,A,1.0,B
JiuZhang3.0-7B,statistics_distributions_h1,statistics,distributions,B,0.0,0.8,A,0.9,A,0.95,A,0.95,A
JiuZhang3.0-7B,statistics_distributions_h2,statistics,distributions,A,1.0,1.0,A,0.98,A,0.95,A,1.0,B
JiuZhang3.0-7B,statistics_distributions_h3,statistics,distributions,Tie,0.5,0.5,B,0.9,B,0.98,B,0.95,A
JiuZhang3.0-7B,statistics_hypothesis_e1,statistics,hypothesis testing,Tie,0.5,0.5,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,statistics_hypothesis_e2,statistics,hypothesis testing,Tie,0.5,0.5,A,1.0,A,0.95,A,1.0,B
JiuZhang3.0-7B,statistics_hypothesis_e3,statistics,hypothesis testing,Tie,0.5,0.5,A,0.95,A,0.95,A,0.95,A
JiuZhang3.0-7B,statistics_hypothesis_m1,statistics,hypothesis testing,A,0.0,0.5,B,0.85,A,0.95,B,0.95,A
JiuZhang3.0-7B,statistics_hypothesis_m2,statistics,hypothesis testing,A,1.0,1.0,A,0.95,A,1.0,A,0.7,A
JiuZhang3.0-7B,statistics_hypothesis_m3,statistics,hypothesis testing,B,1.0,1.0,B,0.9,B,0.95,A,0.8,B
JiuZhang3.0-7B,statistics_hypothesis_h1,statistics,hypothesis testing,A,1.0,1.0,A,0.95,A,0.85,A,0.7,A
JiuZhang3.0-7B,statistics_hypothesis_h2,statistics,hypothesis testing,Tie,0.5,0.5,B,0.75,A,0.85,A,0.9,B
JiuZhang3.0-7B,statistics_hypothesis_h3,statistics,hypothesis testing,Tie,0.5,0.5,B,1.0,B,0.99,B,0.95,B
JiuZhang3.0-7B,statistics_regression_e1,statistics,regression,A,1.0,0.9,A,0.95,B,0.95,A,1.0,A
JiuZhang3.0-7B,statistics_regression_e2,statistics,regression,Tie,0.5,0.5,A,0.85,B,0.95,B,0.9,B
JiuZhang3.0-7B,statistics_regression_e3,statistics,regression,Tie,0.5,0.5,B,0.95,B,0.95,B,0.95,A
JiuZhang3.0-7B,statistics_regression_m1,statistics,regression,B,1.0,1.0,B,0.98,B,0.95,B,1.0,B
JiuZhang3.0-7B,statistics_regression_m2,statistics,regression,Tie,0.5,0.5,B,0.6,B,0.95,B,1.0,B
JiuZhang3.0-7B,statistics_regression_m3,statistics,regression,Tie,0.5,0.5,A,0.85,B,0.95,B,0.95,A
JiuZhang3.0-7B,statistics_regression_h1,statistics,regression,Tie,0.5,0.5,A,0.85,A,0.95,A,1.0,A
JiuZhang3.0-7B,statistics_regression_h2,statistics,regression,A,1.0,1.0,A,0.95,A,0.95,A,0.9,A
JiuZhang3.0-7B,statistics_regression_h3,statistics,regression,A,0.0,1.0,B,0.85,B,0.95,A,0.9,B
JiuZhang3.0-7B,statistics_bayesian_e1,statistics,bayesian inference,Tie,0.5,0.5,A,0.85,A,0.85,A,0.8,B
JiuZhang3.0-7B,statistics_bayesian_e2,statistics,bayesian inference,A,1.0,0.95,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,statistics_bayesian_e3,statistics,bayesian inference,Tie,0.5,0.5,A,0.95,A,0.95,A,1.0,B
JiuZhang3.0-7B,statistics_bayesian_m1,statistics,bayesian inference,Tie,0.5,0.5,B,0.85,B,0.95,B,0.95,A
JiuZhang3.0-7B,statistics_bayesian_m2,statistics,bayesian inference,Tie,0.5,0.5,B,1.0,B,0.95,B,1.0,B
JiuZhang3.0-7B,statistics_bayesian_m3,statistics,bayesian inference,Tie,0.5,0.5,B,0.85,B,0.95,,,A
JiuZhang3.0-7B,statistics_bayesian_h1,statistics,bayesian inference,Tie,0.5,0.5,B,0.9,B,0.95,B,0.9,B
JiuZhang3.0-7B,statistics_bayesian_h2,statistics,bayesian inference,B,1.0,1.0,A,0.7,B,0.7,B,0.4,B
JiuZhang3.0-7B,statistics_bayesian_h3,statistics,bayesian inference,Tie,0.5,0.5,B,0.9,B,0.95,B,0.9,B
JiuZhang3.0-7B,linearalgebra_matrices_e1,linear algebra,matrices,B,1.0,1.0,B,0.95,B,0.95,B,1.0,B
JiuZhang3.0-7B,linearalgebra_matrices_e2,linear algebra,matrices,B,0.0,1.0,A,0.95,A,0.95,A,0.95,A
JiuZhang3.0-7B,linearalgebra_matrices_e3,linear algebra,matrices,A,1.0,0.9,A,1.0,A,0.9,A,1.0,B
JiuZhang3.0-7B,linearalgebra_matrices_m1,linear algebra,matrices,B,0.0,1.0,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,linearalgebra_matrices_m2,linear algebra,matrices,Tie,0.5,0.5,B,0.95,A,0.95,B,0.95,B
JiuZhang3.0-7B,linearalgebra_matrices_m3,linear algebra,matrices,Tie,0.5,0.5,A,1.0,A,0.98,A,1.0,A
JiuZhang3.0-7B,linearalgebra_matrices_h1,linear algebra,matrices,A,1.0,1.0,A,1.0,A,1.0,A,1.0,B
JiuZhang3.0-7B,linearalgebra_matrices_h2,linear algebra,matrices,A,0.0,1.0,B,1.0,B,1.0,B,1.0,B
JiuZhang3.0-7B,linearalgebra_matrices_h3,linear algebra,matrices,Tie,0.5,0.5,B,1.0,B,0.98,B,1.0,B
JiuZhang3.0-7B,linearalgebra_determinants_e1,linear algebra,determinants,B,1.0,1.0,B,0.95,A,0.95,B,0.9,A
JiuZhang3.0-7B,linearalgebra_determinants_e2,linear algebra,determinants,Tie,0.5,0.5,A,0.95,A,0.95,A,1.0,B
JiuZhang3.0-7B,linearalgebra_determinants_e3,linear algebra,determinants,B,1.0,1.0,B,0.9,B,0.98,B,1.0,B
JiuZhang3.0-7B,linearalgebra_determinants_m1,linear algebra,determinants,Tie,0.5,0.5,B,0.95,B,0.95,B,1.0,B
JiuZhang3.0-7B,linearalgebra_determinants_m2,linear algebra,determinants,Tie,0.5,0.5,A,1.0,A,1.0,A,1.0,A
JiuZhang3.0-7B,linearalgebra_determinants_m3,linear algebra,determinants,B,1.0,1.0,B,0.85,B,0.95,B,0.95,B
JiuZhang3.0-7B,linearalgebra_determinants_h1,linear algebra,determinants,Tie,0.5,0.5,A,0.6,B,0.85,,,A
JiuZhang3.0-7B,linearalgebra_determinants_h2,linear algebra,determinants,Tie,0.5,0.5,B,0.95,B,0.4,B,0.75,B
JiuZhang3.0-7B,linearalgebra_determinants_h3,linear algebra,determinants,Tie,0.5,0.5,B,0.9,B,0.95,B,1.0,A
JiuZhang3.0-7B,linearalgebra_vectorspaces_e1,linear algebra,vector spaces,A,0.0,0.9,B,0.95,B,0.98,B,1.0,B
JiuZhang3.0-7B,linearalgebra_vectorspaces_e2,linear algebra,vector spaces,B,1.0,0.5,B,1.0,B,0.95,B,1.0,A
JiuZhang3.0-7B,linearalgebra_vectorspaces_e3,linear algebra,vector spaces,Tie,0.5,0.5,B,0.85,A,0.95,B,0.95,A
JiuZhang3.0-7B,linearalgebra_vectorspaces_m1,linear algebra,vector spaces,B,1.0,0.8,B,0.95,B,0.95,A,1.0,A
JiuZhang3.0-7B,linearalgebra_vectorspaces_m2,linear algebra,vector spaces,Tie,0.5,0.5,A,0.85,B,0.95,A,0.95,A
JiuZhang3.0-7B,linearalgebra_vectorspaces_m3,linear algebra,vector spaces,A,1.0,1.0,A,0.7,A,0.6,B,0.9,B
JiuZhang3.0-7B,linearalgebra_vectorspaces_h1,linear algebra,vector spaces,A,0.0,0.5,B,0.65,B,0.7,B,0.4,A
JiuZhang3.0-7B,linearalgebra_vectorspaces_h2,linear algebra,vector spaces,A,0.0,0.5,B,1.0,B,0.98,B,1.0,B
JiuZhang3.0-7B,linearalgebra_vectorspaces_h3,linear algebra,vector spaces,Tie,0.5,0.5,A,0.9,A,0.9,A,0.7,A
JiuZhang3.0-7B,linearalgebra_eigenvalues_e1,linear algebra,eigenvalues,A,1.0,1.0,A,0.95,A,0.95,A,1.0,B
JiuZhang3.0-7B,linearalgebra_eigenvalues_e2,linear algebra,eigenvalues,Tie,0.5,0.5,A,1.0,A,1.0,A,1.0,B
JiuZhang3.0-7B,linearalgebra_eigenvalues_e3,linear algebra,eigenvalues,B,1.0,1.0,B,0.85,B,0.95,B,1.0,B
JiuZhang3.0-7B,linearalgebra_eigenvalues_m1,linear algebra,eigenvalues,B,1.0,1.0,B,0.98,B,0.98,B,1.0,B
JiuZhang3.0-7B,linearalgebra_eigenvalues_m2,linear algebra,eigenvalues,A,0.0,0.95,B,0.95,B,0.95,B,0.8,B
JiuZhang3.0-7B,linearalgebra_eigenvalues_m3,linear algebra,eigenvalues,Tie,0.5,0.5,B,0.95,B,1.0,B,1.0,A
JiuZhang3.0-7B,linearalgebra_eigenvalues_h1,linear algebra,eigenvalues,B,1.0,0.5,B,0.65,B,0.85,,,B
JiuZhang3.0-7B,linearalgebra_eigenvalues_h2,linear algebra,eigenvalues,B,1.0,0.95,B,1.0,B,0.9,B,0.6,A
JiuZhang3.0-7B,linearalgebra_eigenvalues_h3,linear algebra,eigenvalues,B,0.0,0.5,A,0.6,A,0.85,,,A
JiuZhang3.0-7B,linearalgebra_transformations_e1,linear algebra,linear transformations,Tie,0.5,0.5,A,0.75,A,0.95,B,1.0,A
JiuZhang3.0-7B,linearalgebra_transformations_e2,linear algebra,linear transformations,A,0.0,1.0,B,0.85,B,0.95,B,0.9,B
JiuZhang3.0-7B,linearalgebra_transformations_e3,linear algebra,linear transformations,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
JiuZhang3.0-7B,linearalgebra_transformations_m1,linear algebra,linear transformations,Tie,0.5,0.5,B,0.85,B,0.95,B,0.95,A
JiuZhang3.0-7B,linearalgebra_transformations_m2,linear algebra,linear transformations,Tie,0.5,0.5,B,1.0,B,1.0,B,1.0,A
JiuZhang3.0-7B,linearalgebra_transformations_m3,linear algebra,linear transformations,Tie,0.5,0.5,B,0.9,B,0.95,A,0.95,B
JiuZhang3.0-7B,linearalgebra_transformations_h1,linear algebra,linear transformations,Tie,0.5,0.5,B,0.75,B,0.95,,,A
JiuZhang3.0-7B,linearalgebra_transformations_h2,linear algebra,linear transformations,Tie,0.5,0.5,B,0.85,B,0.98,B,0.8,A
JiuZhang3.0-7B,linearalgebra_transformations_h3,linear algebra,linear transformations,Tie,0.5,0.5,A,1.0,A,0.95,A,0.9,A
Ministral-8B-Instruct-2410,arithmetic_basic_operations_e1,arithmetic,basic operations,A,1.0,0.95,A,1.0,A,1.0,A,1.0,A
Ministral-8B-Instruct-2410,arithmetic_basic_operations_e2,arithmetic,basic operations,A,1.0,1.0,A,0.95,A,0.95,A,0.75,A
Ministral-8B-Instruct-2410,arithmetic_basic_operations_e3,arithmetic,basic operations,B,1.0,1.0,B,0.95,B,0.95,A,0.95,B
Ministral-8B-Instruct-2410,arithmetic_basic_operations_m1,arithmetic,basic operations,B,1.0,0.95,B,0.98,B,1.0,B,0.9,A
Ministral-8B-Instruct-2410,arithmetic_basic_operations_m2,arithmetic,basic operations,B,0.0,0.9,A,0.95,A,0.95,A,1.0,B
Ministral-8B-Instruct-2410,arithmetic_basic_operations_m3,arithmetic,basic operations,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_basic_operations_h1,arithmetic,basic operations,A,0.0,0.95,A,0.85,B,0.95,B,0.9,B
Ministral-8B-Instruct-2410,arithmetic_basic_operations_h2,arithmetic,basic operations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_basic_operations_h3,arithmetic,basic operations,A,1.0,0.95,A,0.8,A,0.95,A,1.0,B
Ministral-8B-Instruct-2410,arithmetic_fractions_e1,arithmetic,fractions,B,0.0,0.95,B,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_fractions_e2,arithmetic,fractions,A,0.0,1.0,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,arithmetic_fractions_e3,arithmetic,fractions,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,arithmetic_fractions_m1,arithmetic,fractions,A,0.0,0.95,A,0.9,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,arithmetic_fractions_m2,arithmetic,fractions,B,0.0,0.95,A,0.85,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,arithmetic_fractions_m3,arithmetic,fractions,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_fractions_h1,arithmetic,fractions,B,1.0,0.95,B,0.9,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,arithmetic_fractions_h2,arithmetic,fractions,B,1.0,1.0,B,0.85,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,arithmetic_fractions_h3,arithmetic,fractions,A,1.0,0.85,A,0.9,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_percentages_e1,arithmetic,percentages,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_percentages_e2,arithmetic,percentages,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,arithmetic_percentages_e3,arithmetic,percentages,A,1.0,0.95,A,0.85,A,0.95,A,1.0,B
Ministral-8B-Instruct-2410,arithmetic_percentages_m1,arithmetic,percentages,B,0.0,0.9,B,0.9,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_percentages_m2,arithmetic,percentages,B,1.0,0.95,B,0.9,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,arithmetic_percentages_m3,arithmetic,percentages,B,0.0,0.9,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_percentages_h1,arithmetic,percentages,B,0.0,0.95,A,0.9,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_percentages_h2,arithmetic,percentages,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_percentages_h3,arithmetic,percentages,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,arithmetic_numerical_e1,arithmetic,numerical approximation,A,1.0,0.95,A,0.85,A,0.95,B,1.0,B
Ministral-8B-Instruct-2410,arithmetic_numerical_e2,arithmetic,numerical approximation,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_numerical_e3,arithmetic,numerical approximation,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_numerical_m1,arithmetic,numerical approximation,A,1.0,0.95,A,1.0,A,0.85,A,0.7,A
Ministral-8B-Instruct-2410,arithmetic_numerical_m2,arithmetic,numerical approximation,B,0.0,0.85,A,0.95,A,0.95,A,0.9,A
Ministral-8B-Instruct-2410,arithmetic_numerical_m3,arithmetic,numerical approximation,B,1.0,0.9,B,0.98,B,0.95,B,1.0,A
Ministral-8B-Instruct-2410,arithmetic_numerical_h1,arithmetic,numerical approximation,A,1.0,1.0,B,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_numerical_h2,arithmetic,numerical approximation,A,1.0,0.95,B,0.8,A,0.95,,,B
Ministral-8B-Instruct-2410,arithmetic_numerical_h3,arithmetic,numerical approximation,B,1.0,0.95,B,0.95,B,0.95,B,1.0,A
Ministral-8B-Instruct-2410,arithmetic_order_e1,arithmetic,order of operations,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_order_e2,arithmetic,order of operations,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_order_e3,arithmetic,order of operations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,arithmetic_order_m1,arithmetic,order of operations,A,1.0,0.95,A,0.95,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,arithmetic_order_m2,arithmetic,order of operations,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,arithmetic_order_m3,arithmetic,order of operations,A,1.0,0.95,A,0.95,A,0.95,B,0.95,B
Ministral-8B-Instruct-2410,arithmetic_order_h1,arithmetic,order of operations,B,0.0,0.9,A,0.85,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,arithmetic_order_h2,arithmetic,order of operations,A,1.0,0.9,B,0.9,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,arithmetic_order_h3,arithmetic,order of operations,A,1.0,0.95,A,1.0,A,1.0,A,1.0,B
Ministral-8B-Instruct-2410,algebra_equations_e1,algebra,equations,A,0.0,0.95,B,0.98,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,algebra_equations_e2,algebra,equations,A,0.0,0.85,B,0.95,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,algebra_equations_e3,algebra,equations,A,1.0,1.0,A,0.95,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,algebra_equations_m1,algebra,equations,B,0.0,0.9,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,algebra_equations_m2,algebra,equations,B,0.0,0.95,A,0.95,A,0.95,A,0.9,A
Ministral-8B-Instruct-2410,algebra_equations_m3,algebra,equations,B,0.0,0.95,A,0.95,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,algebra_equations_h1,algebra,equations,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,algebra_equations_h2,algebra,equations,B,0.0,0.95,A,1.0,A,1.0,A,0.9,A
Ministral-8B-Instruct-2410,algebra_equations_h3,algebra,equations,B,0.0,0.6,A,0.95,B,0.85,A,0.8,B
Ministral-8B-Instruct-2410,algebra_inequalities_e1,algebra,inequalities,A,0.0,0.9,B,0.85,A,0.95,B,0.95,B
Ministral-8B-Instruct-2410,algebra_inequalities_e2,algebra,inequalities,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,algebra_inequalities_e3,algebra,inequalities,B,0.0,0.95,B,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,algebra_inequalities_m1,algebra,inequalities,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,algebra_inequalities_m2,algebra,inequalities,B,0.0,0.95,B,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,algebra_inequalities_m3,algebra,inequalities,A,0.0,0.9,B,0.7,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,algebra_inequalities_h1,algebra,inequalities,A,1.0,0.9,A,0.85,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,algebra_inequalities_h2,algebra,inequalities,B,1.0,0.95,B,0.9,B,0.95,B,0.9,A
Ministral-8B-Instruct-2410,algebra_inequalities_h3,algebra,inequalities,B,0.0,0.95,A,0.85,B,0.98,A,0.95,A
Ministral-8B-Instruct-2410,algebra_polynomials_e1,algebra,polynomials,B,1.0,1.0,B,0.85,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,algebra_polynomials_e2,algebra,polynomials,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,algebra_polynomials_e3,algebra,polynomials,A,1.0,0.85,A,1.0,A,1.0,A,1.0,A
Ministral-8B-Instruct-2410,algebra_polynomials_m1,algebra,polynomials,B,0.0,0.95,A,0.95,A,0.98,A,1.0,A
Ministral-8B-Instruct-2410,algebra_polynomials_m2,algebra,polynomials,B,1.0,0.9,B,1.0,B,1.0,B,1.0,A
Ministral-8B-Instruct-2410,algebra_polynomials_m3,algebra,polynomials,B,1.0,0.95,B,1.0,B,1.0,B,1.0,A
Ministral-8B-Instruct-2410,algebra_polynomials_h1,algebra,polynomials,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,algebra_polynomials_h2,algebra,polynomials,B,1.0,0.95,B,0.75,B,0.6,A,0.7,A
Ministral-8B-Instruct-2410,algebra_polynomials_h3,algebra,polynomials,B,0.0,1.0,B,0.75,A,0.6,A,0.7,A
Ministral-8B-Instruct-2410,algebra_functions_e1,algebra,functions,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,algebra_functions_e2,algebra,functions,B,0.0,0.95,A,0.85,A,0.95,A,1.0,B
Ministral-8B-Instruct-2410,algebra_functions_e3,algebra,functions,A,0.0,1.0,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,algebra_functions_m1,algebra,functions,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,algebra_functions_m2,algebra,functions,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,algebra_functions_m3,algebra,functions,A,0.0,1.0,B,0.95,A,0.95,B,0.8,A
Ministral-8B-Instruct-2410,algebra_functions_h1,algebra,functions,A,0.0,1.0,B,0.85,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,algebra_functions_h2,algebra,functions,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,algebra_functions_h3,algebra,functions,B,0.0,0.95,A,0.7,A,0.75,A,0.7,B
Ministral-8B-Instruct-2410,algebra_systems_e1,algebra,systems of equations,A,1.0,0.9,A,0.85,A,0.95,B,0.95,B
Ministral-8B-Instruct-2410,algebra_systems_e2,algebra,systems of equations,B,0.0,0.9,B,0.65,A,0.95,A,0.9,A
Ministral-8B-Instruct-2410,algebra_systems_e3,algebra,systems of equations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,algebra_systems_m1,algebra,systems of equations,B,1.0,0.9,B,0.98,B,1.0,B,1.0,A
Ministral-8B-Instruct-2410,algebra_systems_m2,algebra,systems of equations,B,0.0,0.9,A,0.85,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,algebra_systems_m3,algebra,systems of equations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,algebra_systems_h1,algebra,systems of equations,B,1.0,0.85,B,0.95,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,algebra_systems_h2,algebra,systems of equations,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,algebra_systems_h3,algebra,systems of equations,B,0.0,1.0,A,1.0,A,0.95,A,1.0,B
Ministral-8B-Instruct-2410,calculus_differentiation_e1,calculus,differentiation,B,1.0,0.9,B,0.95,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,calculus_differentiation_e2,calculus,differentiation,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,calculus_differentiation_e3,calculus,differentiation,A,1.0,0.95,A,0.85,A,0.98,A,0.95,B
Ministral-8B-Instruct-2410,calculus_differentiation_m1,calculus,differentiation,B,1.0,0.9,B,0.9,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,calculus_differentiation_m2,calculus,differentiation,A,1.0,0.9,A,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,calculus_differentiation_m3,calculus,differentiation,B,1.0,0.8,B,0.98,B,0.99,B,0.95,B
Ministral-8B-Instruct-2410,calculus_differentiation_h1,calculus,differentiation,B,0.0,1.0,B,0.85,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,calculus_differentiation_h2,calculus,differentiation,B,0.0,0.95,B,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,calculus_differentiation_h3,calculus,differentiation,A,1.0,0.95,A,1.0,A,1.0,A,1.0,B
Ministral-8B-Instruct-2410,calculus_integration_e1,calculus,integration,B,1.0,0.9,B,1.0,B,1.0,B,1.0,B
Ministral-8B-Instruct-2410,calculus_integration_e2,calculus,integration,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,calculus_integration_e3,calculus,integration,A,0.0,0.95,B,0.95,B,0.95,A,0.9,A
Ministral-8B-Instruct-2410,calculus_integration_m1,calculus,integration,B,1.0,0.95,B,0.95,A,0.95,B,1.0,A
Ministral-8B-Instruct-2410,calculus_integration_m2,calculus,integration,B,1.0,1.0,B,1.0,B,1.0,B,1.0,A
Ministral-8B-Instruct-2410,calculus_integration_m3,calculus,integration,B,1.0,0.95,B,0.85,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,calculus_integration_h1,calculus,integration,A,0.0,1.0,B,0.95,B,0.95,B,1.0,A
Ministral-8B-Instruct-2410,calculus_integration_h2,calculus,integration,B,0.0,0.95,A,1.0,A,1.0,A,1.0,A
Ministral-8B-Instruct-2410,calculus_integration_h3,calculus,integration,A,1.0,0.95,A,1.0,A,1.0,A,1.0,A
Ministral-8B-Instruct-2410,calculus_limits_e1,calculus,limits,B,0.0,0.95,A,0.95,A,0.9,A,1.0,A
Ministral-8B-Instruct-2410,calculus_limits_e2,calculus,limits,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
Ministral-8B-Instruct-2410,calculus_limits_e3,calculus,limits,A,1.0,0.95,B,0.9,A,0.95,A,1.0,B
Ministral-8B-Instruct-2410,calculus_limits_m1,calculus,limits,B,1.0,0.9,B,0.92,B,0.95,A,0.95,B
Ministral-8B-Instruct-2410,calculus_limits_m2,calculus,limits,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,calculus_limits_m3,calculus,limits,A,1.0,0.95,A,0.9,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,calculus_limits_h1,calculus,limits,B,1.0,1.0,B,0.75,B,0.9,,,B
Ministral-8B-Instruct-2410,calculus_limits_h2,calculus,limits,A,1.0,0.9,A,1.0,A,1.0,A,1.0,B
Ministral-8B-Instruct-2410,calculus_limits_h3,calculus,limits,A,0.0,0.95,B,0.85,A,0.95,B,0.9,B
Ministral-8B-Instruct-2410,calculus_series_e1,calculus,series,A,0.0,0.95,B,0.75,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,calculus_series_e2,calculus,series,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,calculus_series_e3,calculus,series,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Ministral-8B-Instruct-2410,calculus_series_m1,calculus,series,B,0.0,0.95,A,0.9,A,0.95,B,0.9,A
Ministral-8B-Instruct-2410,calculus_series_m2,calculus,series,A,0.0,0.9,B,0.85,A,0.9,B,0.95,A
Ministral-8B-Instruct-2410,calculus_series_m3,calculus,series,B,1.0,0.9,B,0.85,B,0.85,,,A
Ministral-8B-Instruct-2410,calculus_series_h1,calculus,series,A,0.0,0.95,B,1.0,B,0.98,B,1.0,B
Ministral-8B-Instruct-2410,calculus_series_h2,calculus,series,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,calculus_series_h3,calculus,series,B,1.0,0.95,B,0.95,B,0.95,B,0.9,B
Ministral-8B-Instruct-2410,calculus_applications_e1,calculus,applications,A,1.0,0.95,A,0.75,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,calculus_applications_e2,calculus,applications,B,0.0,0.8,A,1.0,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,calculus_applications_e3,calculus,applications,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,calculus_applications_m1,calculus,applications,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
Ministral-8B-Instruct-2410,calculus_applications_m2,calculus,applications,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,calculus_applications_m3,calculus,applications,B,0.0,0.9,A,0.9,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,calculus_applications_h1,calculus,applications,B,1.0,0.95,B,0.7,B,0.9,,,B
Ministral-8B-Instruct-2410,calculus_applications_h2,calculus,applications,B,1.0,0.9,B,0.95,B,0.95,B,0.95,A
Ministral-8B-Instruct-2410,calculus_applications_h3,calculus,applications,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
Ministral-8B-Instruct-2410,geometry_plane_e1,geometry,plane geometry,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,geometry_plane_e2,geometry,plane geometry,A,0.0,1.0,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,geometry_plane_e3,geometry,plane geometry,A,0.0,0.95,B,0.9,A,0.95,B,0.95,B
Ministral-8B-Instruct-2410,geometry_plane_m1,geometry,plane geometry,B,0.0,0.95,A,0.8,A,0.95,B,0.95,B
Ministral-8B-Instruct-2410,geometry_plane_m2,geometry,plane geometry,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,geometry_plane_m3,geometry,plane geometry,A,1.0,1.0,B,0.8,A,0.95,A,0.9,B
Ministral-8B-Instruct-2410,geometry_plane_h1,geometry,plane geometry,B,0.0,0.9,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,geometry_plane_h2,geometry,plane geometry,A,0.0,1.0,B,1.0,B,1.0,B,1.0,B
Ministral-8B-Instruct-2410,geometry_plane_h3,geometry,plane geometry,B,0.0,0.9,A,1.0,A,1.0,A,1.0,A
Ministral-8B-Instruct-2410,geometry_coordinate_e1,geometry,coordinate geometry,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,geometry_coordinate_e2,geometry,coordinate geometry,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,geometry_coordinate_e3,geometry,coordinate geometry,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,geometry_coordinate_m1,geometry,coordinate geometry,B,1.0,0.95,B,0.85,B,0.9,A,0.9,A
Ministral-8B-Instruct-2410,geometry_coordinate_m2,geometry,coordinate geometry,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,geometry_coordinate_m3,geometry,coordinate geometry,B,1.0,0.95,B,0.95,A,0.95,B,1.0,A
Ministral-8B-Instruct-2410,geometry_coordinate_h1,geometry,coordinate geometry,A,1.0,0.95,A,0.85,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,geometry_coordinate_h2,geometry,coordinate geometry,B,1.0,0.85,B,0.85,B,0.98,B,0.95,B
Ministral-8B-Instruct-2410,geometry_coordinate_h3,geometry,coordinate geometry,B,1.0,1.0,B,1.0,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,geometry_transformations_e1,geometry,transformations,B,0.0,0.95,B,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,geometry_transformations_e2,geometry,transformations,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
Ministral-8B-Instruct-2410,geometry_transformations_e3,geometry,transformations,B,1.0,0.9,B,0.85,B,0.95,A,0.95,B
Ministral-8B-Instruct-2410,geometry_transformations_m1,geometry,transformations,B,0.0,0.95,A,0.95,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,geometry_transformations_m2,geometry,transformations,A,0.0,1.0,B,0.95,B,0.85,B,0.8,B
Ministral-8B-Instruct-2410,geometry_transformations_m3,geometry,transformations,B,0.0,1.0,A,0.95,B,0.9,A,0.95,B
Ministral-8B-Instruct-2410,geometry_transformations_h1,geometry,transformations,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,geometry_transformations_h2,geometry,transformations,B,1.0,0.9,B,0.9,B,0.95,,,B
Ministral-8B-Instruct-2410,geometry_transformations_h3,geometry,transformations,A,0.0,0.9,B,0.85,B,0.8,,,A
Ministral-8B-Instruct-2410,geometry_mensuration_e1,geometry,mensuration,B,1.0,1.0,B,0.98,B,0.95,A,0.85,B
Ministral-8B-Instruct-2410,geometry_mensuration_e2,geometry,mensuration,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,geometry_mensuration_e3,geometry,mensuration,B,0.0,1.0,A,1.0,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,geometry_mensuration_m1,geometry,mensuration,B,1.0,0.95,B,0.95,B,0.98,B,1.0,A
Ministral-8B-Instruct-2410,geometry_mensuration_m2,geometry,mensuration,B,1.0,1.0,B,1.0,B,0.98,B,1.0,B
Ministral-8B-Instruct-2410,geometry_mensuration_m3,geometry,mensuration,A,0.0,0.95,B,0.85,B,0.95,B,0.9,B
Ministral-8B-Instruct-2410,geometry_mensuration_h1,geometry,mensuration,A,1.0,0.95,B,0.75,A,0.9,A,1.0,A
Ministral-8B-Instruct-2410,geometry_mensuration_h2,geometry,mensuration,B,1.0,0.95,B,0.95,B,0.85,B,0.7,A
Ministral-8B-Instruct-2410,geometry_mensuration_h3,geometry,mensuration,B,0.0,0.95,A,0.8,A,0.65,A,0.7,A
Ministral-8B-Instruct-2410,geometry_trigonometry_e1,geometry,trigonometry,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,geometry_trigonometry_e2,geometry,trigonometry,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,geometry_trigonometry_e3,geometry,trigonometry,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,geometry_trigonometry_m1,geometry,trigonometry,B,1.0,0.95,B,0.75,B,0.95,B,0.9,A
Ministral-8B-Instruct-2410,geometry_trigonometry_m2,geometry,trigonometry,A,0.0,0.95,A,0.9,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,geometry_trigonometry_m3,geometry,trigonometry,B,0.0,0.9,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,geometry_trigonometry_h1,geometry,trigonometry,B,0.0,0.95,A,0.9,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,geometry_trigonometry_h2,geometry,trigonometry,A,0.0,0.95,B,0.85,B,0.6,B,0.95,A
Ministral-8B-Instruct-2410,geometry_trigonometry_h3,geometry,trigonometry,A,0.0,0.9,B,0.75,B,0.9,B,0.9,A
Ministral-8B-Instruct-2410,numbertheory_divisibility_e1,number theory,divisibility,A,1.0,0.9,B,0.95,A,0.95,A,0.9,A
Ministral-8B-Instruct-2410,numbertheory_divisibility_e2,number theory,divisibility,A,1.0,0.95,A,0.85,A,0.95,A,1.0,B
Ministral-8B-Instruct-2410,numbertheory_divisibility_e3,number theory,divisibility,B,1.0,0.95,B,0.95,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,numbertheory_divisibility_m1,number theory,divisibility,A,0.0,1.0,B,1.0,B,1.0,B,1.0,A
Ministral-8B-Instruct-2410,numbertheory_divisibility_m2,number theory,divisibility,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,numbertheory_divisibility_m3,number theory,divisibility,A,1.0,0.95,B,0.9,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,numbertheory_divisibility_h1,number theory,divisibility,A,1.0,0.95,B,0.8,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,numbertheory_divisibility_h2,number theory,divisibility,B,1.0,0.9,B,0.9,B,0.95,B,0.95,A
Ministral-8B-Instruct-2410,numbertheory_divisibility_h3,number theory,divisibility,B,1.0,0.9,B,0.95,B,0.95,B,0.95,A
Ministral-8B-Instruct-2410,numbertheory_modular_e1,number theory,modular arithmetic,A,0.0,0.95,A,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,numbertheory_modular_e2,number theory,modular arithmetic,A,0.0,0.95,B,0.95,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,numbertheory_modular_e3,number theory,modular arithmetic,B,1.0,0.95,B,0.85,A,0.95,B,1.0,A
Ministral-8B-Instruct-2410,numbertheory_modular_m1,number theory,modular arithmetic,A,0.0,0.95,B,1.0,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,numbertheory_modular_m2,number theory,modular arithmetic,B,1.0,0.95,B,0.9,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,numbertheory_modular_m3,number theory,modular arithmetic,B,1.0,0.9,B,0.85,B,0.95,B,0.95,A
Ministral-8B-Instruct-2410,numbertheory_modular_h1,number theory,modular arithmetic,B,1.0,1.0,B,0.85,B,0.98,B,0.7,A
Ministral-8B-Instruct-2410,numbertheory_modular_h2,number theory,modular arithmetic,B,1.0,1.0,B,0.85,B,0.85,B,0.7,A
Ministral-8B-Instruct-2410,numbertheory_modular_h3,number theory,modular arithmetic,B,1.0,0.9,B,0.98,B,0.95,B,1.0,A
Ministral-8B-Instruct-2410,numbertheory_primes_e1,number theory,primes,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,numbertheory_primes_e2,number theory,primes,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Ministral-8B-Instruct-2410,numbertheory_primes_e3,number theory,primes,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,numbertheory_primes_m1,number theory,primes,B,0.0,0.9,A,0.95,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,numbertheory_primes_m2,number theory,primes,B,0.0,0.95,A,1.0,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,numbertheory_primes_m3,number theory,primes,A,0.0,0.95,B,0.95,A,0.95,B,0.9,B
Ministral-8B-Instruct-2410,numbertheory_primes_h1,number theory,primes,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,numbertheory_primes_h2,number theory,primes,A,0.0,0.95,B,0.95,A,0.95,B,0.9,B
Ministral-8B-Instruct-2410,numbertheory_primes_h3,number theory,primes,B,0.0,0.95,A,0.95,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,numbertheory_diophantine_e1,number theory,diophantine equations,A,0.0,0.95,B,1.0,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,numbertheory_diophantine_e2,number theory,diophantine equations,B,1.0,0.9,B,0.9,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,numbertheory_diophantine_e3,number theory,diophantine equations,B,1.0,0.9,B,0.95,B,0.95,B,0.95,A
Ministral-8B-Instruct-2410,numbertheory_diophantine_m1,number theory,diophantine equations,B,1.0,0.95,B,0.85,A,0.95,B,0.8,A
Ministral-8B-Instruct-2410,numbertheory_diophantine_m2,number theory,diophantine equations,B,0.0,0.95,B,0.95,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,numbertheory_diophantine_m3,number theory,diophantine equations,B,1.0,0.95,B,1.0,B,0.95,B,0.95,A
Ministral-8B-Instruct-2410,numbertheory_diophantine_h1,number theory,diophantine equations,B,0.0,0.9,A,0.95,A,0.95,A,0.9,A
Ministral-8B-Instruct-2410,numbertheory_diophantine_h2,number theory,diophantine equations,A,1.0,0.9,A,0.95,A,0.9,A,0.95,B
Ministral-8B-Instruct-2410,numbertheory_diophantine_h3,number theory,diophantine equations,A,1.0,0.95,B,0.85,A,0.95,A,0.7,A
Ministral-8B-Instruct-2410,numbertheory_sequences_e1,number theory,number sequences,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,numbertheory_sequences_e2,number theory,number sequences,B,0.0,0.95,A,0.9,A,0.95,A,0.9,A
Ministral-8B-Instruct-2410,numbertheory_sequences_e3,number theory,number sequences,B,0.0,0.95,A,1.0,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,numbertheory_sequences_m1,number theory,number sequences,A,0.0,0.9,A,0.9,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,numbertheory_sequences_m2,number theory,number sequences,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,numbertheory_sequences_m3,number theory,number sequences,A,0.0,0.9,B,0.9,A,0.95,B,0.95,B
Ministral-8B-Instruct-2410,numbertheory_sequences_h1,number theory,number sequences,A,1.0,1.0,A,0.95,A,0.95,A,1.0,B
Ministral-8B-Instruct-2410,numbertheory_sequences_h2,number theory,number sequences,A,1.0,0.95,A,0.55,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,numbertheory_sequences_h3,number theory,number sequences,B,0.0,0.95,B,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,combinatorics_counting_e1,combinatorics,counting principles,B,1.0,0.95,B,0.9,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,combinatorics_counting_e2,combinatorics,counting principles,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,combinatorics_counting_e3,combinatorics,counting principles,B,0.0,0.95,B,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,combinatorics_counting_m1,combinatorics,counting principles,A,0.0,0.95,B,0.95,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,combinatorics_counting_m2,combinatorics,counting principles,B,0.0,0.9,A,0.85,A,0.95,B,0.9,A
Ministral-8B-Instruct-2410,combinatorics_counting_m3,combinatorics,counting principles,A,1.0,1.0,A,0.8,A,0.95,B,0.95,B
Ministral-8B-Instruct-2410,combinatorics_counting_h1,combinatorics,counting principles,B,1.0,1.0,B,0.7,B,0.5,A,0.6,B
Ministral-8B-Instruct-2410,combinatorics_counting_h2,combinatorics,counting principles,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,combinatorics_counting_h3,combinatorics,counting principles,A,0.0,1.0,B,0.75,A,0.85,B,0.7,A
Ministral-8B-Instruct-2410,combinatorics_permutations_e1,combinatorics,permutations,A,0.0,0.9,B,0.85,A,0.9,B,0.9,A
Ministral-8B-Instruct-2410,combinatorics_permutations_e2,combinatorics,permutations,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,combinatorics_permutations_e3,combinatorics,permutations,A,1.0,0.9,A,0.85,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,combinatorics_permutations_m1,combinatorics,permutations,A,1.0,1.0,A,1.0,A,1.0,A,1.0,B
Ministral-8B-Instruct-2410,combinatorics_permutations_m2,combinatorics,permutations,A,0.0,1.0,B,0.85,B,0.85,,,B
Ministral-8B-Instruct-2410,combinatorics_permutations_m3,combinatorics,permutations,A,1.0,0.95,A,0.95,A,0.95,B,1.0,B
Ministral-8B-Instruct-2410,combinatorics_permutations_h1,combinatorics,permutations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,combinatorics_permutations_h2,combinatorics,permutations,B,0.0,0.9,A,0.75,A,1.0,A,0.8,B
Ministral-8B-Instruct-2410,combinatorics_permutations_h3,combinatorics,permutations,B,0.0,0.95,A,0.75,A,0.7,A,0.6,B
Ministral-8B-Instruct-2410,combinatorics_combinations_e1,combinatorics,combinations,B,0.0,0.95,A,0.9,A,0.95,B,0.95,B
Ministral-8B-Instruct-2410,combinatorics_combinations_e2,combinatorics,combinations,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,combinatorics_combinations_e3,combinatorics,combinations,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,combinatorics_combinations_m1,combinatorics,combinations,B,0.0,0.9,B,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,combinatorics_combinations_m2,combinatorics,combinations,B,1.0,0.9,B,0.95,B,0.95,B,0.9,B
Ministral-8B-Instruct-2410,combinatorics_combinations_m3,combinatorics,combinations,A,0.0,0.9,B,0.9,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,combinatorics_combinations_h1,combinatorics,combinations,B,1.0,0.95,B,0.85,A,0.95,B,1.0,A
Ministral-8B-Instruct-2410,combinatorics_combinations_h2,combinatorics,combinations,A,1.0,1.0,A,1.0,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,combinatorics_combinations_h3,combinatorics,combinations,B,1.0,1.0,B,1.0,B,1.0,B,1.0,B
Ministral-8B-Instruct-2410,combinatorics_probability_e1,combinatorics,probability,B,1.0,0.95,B,0.85,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,combinatorics_probability_e2,combinatorics,probability,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,combinatorics_probability_e3,combinatorics,probability,A,0.0,1.0,B,0.95,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,combinatorics_probability_m1,combinatorics,probability,B,1.0,0.95,B,0.92,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,combinatorics_probability_m2,combinatorics,probability,A,1.0,0.9,B,0.75,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,combinatorics_probability_m3,combinatorics,probability,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,combinatorics_probability_h1,combinatorics,probability,A,1.0,1.0,A,0.98,A,1.0,A,1.0,A
Ministral-8B-Instruct-2410,combinatorics_probability_h2,combinatorics,probability,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,combinatorics_probability_h3,combinatorics,probability,B,1.0,0.95,B,0.95,B,0.95,B,1.0,A
Ministral-8B-Instruct-2410,combinatorics_recursion_e1,combinatorics,recursion,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,combinatorics_recursion_e2,combinatorics,recursion,B,1.0,1.0,B,0.98,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,combinatorics_recursion_e3,combinatorics,recursion,B,0.0,1.0,A,0.85,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,combinatorics_recursion_m1,combinatorics,recursion,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,combinatorics_recursion_m2,combinatorics,recursion,B,1.0,0.95,B,0.95,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,combinatorics_recursion_m3,combinatorics,recursion,A,0.0,0.9,B,0.85,B,0.9,B,0.7,B
Ministral-8B-Instruct-2410,combinatorics_recursion_h1,combinatorics,recursion,B,1.0,0.95,B,1.0,B,0.98,B,1.0,A
Ministral-8B-Instruct-2410,combinatorics_recursion_h2,combinatorics,recursion,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,combinatorics_recursion_h3,combinatorics,recursion,B,0.0,0.95,A,0.9,A,0.95,A,0.8,B
Ministral-8B-Instruct-2410,statistics_descriptive_e1,statistics,descriptive statistics,B,1.0,0.9,B,0.98,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,statistics_descriptive_e2,statistics,descriptive statistics,A,0.0,0.9,B,0.85,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,statistics_descriptive_e3,statistics,descriptive statistics,B,1.0,0.95,B,0.85,A,0.95,B,1.0,A
Ministral-8B-Instruct-2410,statistics_descriptive_m1,statistics,descriptive statistics,A,0.0,0.95,B,0.9,B,0.95,B,0.9,B
Ministral-8B-Instruct-2410,statistics_descriptive_m2,statistics,descriptive statistics,B,1.0,0.9,B,0.95,B,0.85,A,0.9,A
Ministral-8B-Instruct-2410,statistics_descriptive_m3,statistics,descriptive statistics,A,0.0,0.95,B,0.95,B,0.85,B,0.9,B
Ministral-8B-Instruct-2410,statistics_descriptive_h1,statistics,descriptive statistics,A,1.0,0.95,A,0.9,A,0.95,A,0.8,A
Ministral-8B-Instruct-2410,statistics_descriptive_h2,statistics,descriptive statistics,B,1.0,0.95,B,0.65,B,0.85,B,0.75,A
Ministral-8B-Instruct-2410,statistics_descriptive_h3,statistics,descriptive statistics,B,1.0,0.95,B,1.0,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,statistics_distributions_e1,statistics,distributions,B,1.0,0.95,B,0.85,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,statistics_distributions_e2,statistics,distributions,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,statistics_distributions_e3,statistics,distributions,A,1.0,0.95,A,0.95,B,0.95,A,0.95,B
Ministral-8B-Instruct-2410,statistics_distributions_m1,statistics,distributions,B,0.0,0.9,A,0.95,A,0.95,A,0.85,A
Ministral-8B-Instruct-2410,statistics_distributions_m2,statistics,distributions,A,0.0,0.95,B,0.95,A,0.95,B,1.0,A
Ministral-8B-Instruct-2410,statistics_distributions_m3,statistics,distributions,B,0.0,0.85,A,0.95,A,0.9,A,0.8,B
Ministral-8B-Instruct-2410,statistics_distributions_h1,statistics,distributions,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,statistics_distributions_h2,statistics,distributions,B,0.0,0.9,A,0.95,A,0.98,A,1.0,A
Ministral-8B-Instruct-2410,statistics_distributions_h3,statistics,distributions,B,1.0,0.95,B,0.95,B,0.95,A,0.95,A
Ministral-8B-Instruct-2410,statistics_hypothesis_e1,statistics,hypothesis testing,B,0.0,0.95,B,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,statistics_hypothesis_e2,statistics,hypothesis testing,A,1.0,0.9,B,0.85,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,statistics_hypothesis_e3,statistics,hypothesis testing,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,statistics_hypothesis_m1,statistics,hypothesis testing,B,0.0,0.95,B,0.85,A,0.95,A,0.9,A
Ministral-8B-Instruct-2410,statistics_hypothesis_m2,statistics,hypothesis testing,B,1.0,0.95,B,0.85,B,0.95,A,0.7,A
Ministral-8B-Instruct-2410,statistics_hypothesis_m3,statistics,hypothesis testing,A,0.0,0.9,B,0.9,B,0.85,B,0.9,B
Ministral-8B-Instruct-2410,statistics_hypothesis_h1,statistics,hypothesis testing,A,1.0,0.95,B,0.65,A,0.75,,,B
Ministral-8B-Instruct-2410,statistics_hypothesis_h2,statistics,hypothesis testing,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,statistics_hypothesis_h3,statistics,hypothesis testing,B,0.0,0.9,A,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,statistics_regression_e1,statistics,regression,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,statistics_regression_e2,statistics,regression,A,1.0,0.9,A,0.85,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,statistics_regression_e3,statistics,regression,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,statistics_regression_m1,statistics,regression,A,0.0,0.95,B,0.85,A,0.95,B,0.9,A
Ministral-8B-Instruct-2410,statistics_regression_m2,statistics,regression,A,1.0,0.9,A,0.9,A,0.95,B,0.95,B
Ministral-8B-Instruct-2410,statistics_regression_m3,statistics,regression,B,0.0,0.95,B,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,statistics_regression_h1,statistics,regression,B,0.0,0.95,B,0.85,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,statistics_regression_h2,statistics,regression,A,0.0,1.0,B,0.95,B,1.0,B,1.0,A
Ministral-8B-Instruct-2410,statistics_regression_h3,statistics,regression,B,1.0,0.95,B,0.95,A,0.9,B,0.85,A
Ministral-8B-Instruct-2410,statistics_bayesian_e1,statistics,bayesian inference,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,statistics_bayesian_e2,statistics,bayesian inference,B,0.0,0.75,A,0.6,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,statistics_bayesian_e3,statistics,bayesian inference,B,1.0,0.95,B,0.9,B,0.98,B,0.95,B
Ministral-8B-Instruct-2410,statistics_bayesian_m1,statistics,bayesian inference,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,statistics_bayesian_m2,statistics,bayesian inference,A,1.0,1.0,A,0.85,A,0.9,A,0.7,B
Ministral-8B-Instruct-2410,statistics_bayesian_m3,statistics,bayesian inference,A,0.0,0.95,B,0.98,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,statistics_bayesian_h1,statistics,bayesian inference,B,0.0,0.95,A,0.75,A,0.9,A,0.8,A
Ministral-8B-Instruct-2410,statistics_bayesian_h2,statistics,bayesian inference,A,1.0,0.95,B,0.65,A,0.85,A,0.7,B
Ministral-8B-Instruct-2410,statistics_bayesian_h3,statistics,bayesian inference,A,0.0,0.95,B,0.98,B,0.98,B,1.0,B
Ministral-8B-Instruct-2410,linearalgebra_matrices_e1,linear algebra,matrices,A,1.0,0.9,A,1.0,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,linearalgebra_matrices_e2,linear algebra,matrices,B,1.0,1.0,B,0.95,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,linearalgebra_matrices_e3,linear algebra,matrices,A,1.0,1.0,A,0.98,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,linearalgebra_matrices_m1,linear algebra,matrices,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
Ministral-8B-Instruct-2410,linearalgebra_matrices_m2,linear algebra,matrices,A,1.0,0.95,A,1.0,A,1.0,A,1.0,A
Ministral-8B-Instruct-2410,linearalgebra_matrices_m3,linear algebra,matrices,B,1.0,0.95,B,0.9,B,0.95,A,0.75,A
Ministral-8B-Instruct-2410,linearalgebra_matrices_h1,linear algebra,matrices,A,0.0,1.0,B,0.9,B,0.9,B,0.95,B
Ministral-8B-Instruct-2410,linearalgebra_matrices_h2,linear algebra,matrices,B,1.0,0.95,B,0.85,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,linearalgebra_matrices_h3,linear algebra,matrices,A,1.0,0.9,A,1.0,A,0.98,A,1.0,A
Ministral-8B-Instruct-2410,linearalgebra_determinants_e1,linear algebra,determinants,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,linearalgebra_determinants_e2,linear algebra,determinants,B,0.0,0.95,A,0.95,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,linearalgebra_determinants_e3,linear algebra,determinants,A,0.0,0.95,A,0.85,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,linearalgebra_determinants_m1,linear algebra,determinants,B,1.0,1.0,B,1.0,B,1.0,B,1.0,B
Ministral-8B-Instruct-2410,linearalgebra_determinants_m2,linear algebra,determinants,B,0.0,0.85,A,1.0,A,1.0,A,1.0,A
Ministral-8B-Instruct-2410,linearalgebra_determinants_m3,linear algebra,determinants,A,1.0,0.9,A,0.95,A,0.95,A,0.95,B
Ministral-8B-Instruct-2410,linearalgebra_determinants_h1,linear algebra,determinants,A,1.0,1.0,A,1.0,A,1.0,A,1.0,A
Ministral-8B-Instruct-2410,linearalgebra_determinants_h2,linear algebra,determinants,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,linearalgebra_determinants_h3,linear algebra,determinants,B,1.0,0.95,B,0.95,B,0.95,A,0.95,A
Ministral-8B-Instruct-2410,linearalgebra_vectorspaces_e1,linear algebra,vector spaces,A,0.0,0.95,B,0.9,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,linearalgebra_vectorspaces_e2,linear algebra,vector spaces,B,0.0,0.95,A,0.85,A,0.95,B,0.9,A
Ministral-8B-Instruct-2410,linearalgebra_vectorspaces_e3,linear algebra,vector spaces,B,1.0,0.95,B,0.85,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,linearalgebra_vectorspaces_m1,linear algebra,vector spaces,B,0.0,0.95,A,0.8,A,0.85,A,0.7,A
Ministral-8B-Instruct-2410,linearalgebra_vectorspaces_m2,linear algebra,vector spaces,B,1.0,0.9,B,1.0,B,0.95,B,1.0,B
Ministral-8B-Instruct-2410,linearalgebra_vectorspaces_m3,linear algebra,vector spaces,B,1.0,0.9,B,0.95,B,0.85,B,0.7,B
Ministral-8B-Instruct-2410,linearalgebra_vectorspaces_h1,linear algebra,vector spaces,B,0.0,1.0,A,0.95,A,0.9,A,1.0,A
Ministral-8B-Instruct-2410,linearalgebra_vectorspaces_h2,linear algebra,vector spaces,B,0.0,0.9,A,1.0,A,0.95,A,1.0,B
Ministral-8B-Instruct-2410,linearalgebra_vectorspaces_h3,linear algebra,vector spaces,B,1.0,0.95,B,0.85,B,0.85,B,0.7,A
Ministral-8B-Instruct-2410,linearalgebra_eigenvalues_e1,linear algebra,eigenvalues,B,1.0,1.0,B,0.85,A,0.95,B,0.95,A
Ministral-8B-Instruct-2410,linearalgebra_eigenvalues_e2,linear algebra,eigenvalues,B,1.0,1.0,B,0.75,A,0.95,B,0.95,B
Ministral-8B-Instruct-2410,linearalgebra_eigenvalues_e3,linear algebra,eigenvalues,A,1.0,1.0,A,1.0,A,1.0,A,1.0,B
Ministral-8B-Instruct-2410,linearalgebra_eigenvalues_m1,linear algebra,eigenvalues,B,0.0,0.95,A,0.85,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,linearalgebra_eigenvalues_m2,linear algebra,eigenvalues,B,1.0,1.0,B,1.0,B,1.0,B,0.95,A
Ministral-8B-Instruct-2410,linearalgebra_eigenvalues_m3,linear algebra,eigenvalues,A,0.0,0.95,B,0.65,B,0.95,A,0.9,B
Ministral-8B-Instruct-2410,linearalgebra_eigenvalues_h1,linear algebra,eigenvalues,A,0.0,0.95,B,0.75,B,0.7,,,B
Ministral-8B-Instruct-2410,linearalgebra_eigenvalues_h2,linear algebra,eigenvalues,B,0.0,0.95,B,0.75,A,0.9,A,0.7,A
Ministral-8B-Instruct-2410,linearalgebra_eigenvalues_h3,linear algebra,eigenvalues,A,1.0,0.95,A,0.95,A,0.95,A,1.0,B
Ministral-8B-Instruct-2410,linearalgebra_transformations_e1,linear algebra,linear transformations,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,linearalgebra_transformations_e2,linear algebra,linear transformations,B,1.0,0.9,B,1.0,B,0.95,B,0.9,A
Ministral-8B-Instruct-2410,linearalgebra_transformations_e3,linear algebra,linear transformations,A,1.0,0.9,A,0.95,A,0.95,A,1.0,A
Ministral-8B-Instruct-2410,linearalgebra_transformations_m1,linear algebra,linear transformations,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Ministral-8B-Instruct-2410,linearalgebra_transformations_m2,linear algebra,linear transformations,B,0.0,0.95,A,0.75,A,0.95,A,0.9,B
Ministral-8B-Instruct-2410,linearalgebra_transformations_m3,linear algebra,linear transformations,A,1.0,1.0,A,1.0,A,1.0,A,1.0,A
Ministral-8B-Instruct-2410,linearalgebra_transformations_h1,linear algebra,linear transformations,A,0.0,0.95,B,0.8,B,0.75,,,A
Ministral-8B-Instruct-2410,linearalgebra_transformations_h2,linear algebra,linear transformations,B,1.0,0.95,B,0.65,B,0.75,B,0.6,A
Ministral-8B-Instruct-2410,linearalgebra_transformations_h3,linear algebra,linear transformations,A,0.0,0.9,B,0.85,A,0.6,,,A
Open-Reasoner-Zero-7B,arithmetic_basic_operations_e1,arithmetic,basic operations,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
Open-Reasoner-Zero-7B,arithmetic_basic_operations_e2,arithmetic,basic operations,B,0.0,0.95,A,0.95,A,0.95,B,1.0,A
Open-Reasoner-Zero-7B,arithmetic_basic_operations_e3,arithmetic,basic operations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,arithmetic_basic_operations_m1,arithmetic,basic operations,A,0.0,0.95,B,0.95,A,0.95,B,0.9,A
Open-Reasoner-Zero-7B,arithmetic_basic_operations_m2,arithmetic,basic operations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,arithmetic_basic_operations_m3,arithmetic,basic operations,A,1.0,1.0,A,0.95,A,0.95,B,0.9,A
Open-Reasoner-Zero-7B,arithmetic_basic_operations_h1,arithmetic,basic operations,A,0.0,0.95,B,0.9,B,0.95,A,0.95,B
Open-Reasoner-Zero-7B,arithmetic_basic_operations_h2,arithmetic,basic operations,B,1.0,0.85,B,0.95,B,0.98,B,0.95,A
Open-Reasoner-Zero-7B,arithmetic_basic_operations_h3,arithmetic,basic operations,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,arithmetic_fractions_e1,arithmetic,fractions,B,1.0,0.95,B,0.85,A,0.95,B,1.0,A
Open-Reasoner-Zero-7B,arithmetic_fractions_e2,arithmetic,fractions,A,1.0,0.9,B,0.65,A,0.95,A,1.0,B
Open-Reasoner-Zero-7B,arithmetic_fractions_e3,arithmetic,fractions,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
Open-Reasoner-Zero-7B,arithmetic_fractions_m1,arithmetic,fractions,B,0.0,0.95,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,arithmetic_fractions_m2,arithmetic,fractions,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,arithmetic_fractions_m3,arithmetic,fractions,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,arithmetic_fractions_h1,arithmetic,fractions,A,1.0,0.95,B,0.85,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,arithmetic_fractions_h2,arithmetic,fractions,A,0.0,1.0,B,0.85,A,0.95,B,0.8,A
Open-Reasoner-Zero-7B,arithmetic_fractions_h3,arithmetic,fractions,A,0.0,1.0,B,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,arithmetic_percentages_e1,arithmetic,percentages,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,arithmetic_percentages_e2,arithmetic,percentages,A,1.0,0.95,B,0.95,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,arithmetic_percentages_e3,arithmetic,percentages,A,0.0,0.95,B,0.95,B,0.98,B,0.95,A
Open-Reasoner-Zero-7B,arithmetic_percentages_m1,arithmetic,percentages,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,arithmetic_percentages_m2,arithmetic,percentages,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,arithmetic_percentages_m3,arithmetic,percentages,B,1.0,0.95,B,0.95,B,0.95,A,0.95,A
Open-Reasoner-Zero-7B,arithmetic_percentages_h1,arithmetic,percentages,A,0.0,1.0,B,0.95,B,0.95,B,1.0,A
Open-Reasoner-Zero-7B,arithmetic_percentages_h2,arithmetic,percentages,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,arithmetic_percentages_h3,arithmetic,percentages,A,0.0,0.95,B,0.95,B,0.95,B,1.0,B
Open-Reasoner-Zero-7B,arithmetic_numerical_e1,arithmetic,numerical approximation,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,arithmetic_numerical_e2,arithmetic,numerical approximation,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,arithmetic_numerical_e3,arithmetic,numerical approximation,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,arithmetic_numerical_m1,arithmetic,numerical approximation,B,1.0,0.95,B,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,arithmetic_numerical_m2,arithmetic,numerical approximation,A,0.0,0.95,B,0.85,B,0.95,A,0.95,A
Open-Reasoner-Zero-7B,arithmetic_numerical_m3,arithmetic,numerical approximation,A,1.0,0.95,B,0.9,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,arithmetic_numerical_h1,arithmetic,numerical approximation,A,0.0,1.0,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,arithmetic_numerical_h2,arithmetic,numerical approximation,A,0.0,0.9,B,0.85,A,0.95,B,0.9,A
Open-Reasoner-Zero-7B,arithmetic_numerical_h3,arithmetic,numerical approximation,B,0.0,0.95,B,0.8,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,arithmetic_order_e1,arithmetic,order of operations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,arithmetic_order_e2,arithmetic,order of operations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,arithmetic_order_e3,arithmetic,order of operations,A,1.0,1.0,B,0.9,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,arithmetic_order_m1,arithmetic,order of operations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,arithmetic_order_m2,arithmetic,order of operations,A,1.0,1.0,A,0.9,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,arithmetic_order_m3,arithmetic,order of operations,A,0.0,1.0,B,0.85,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,arithmetic_order_h1,arithmetic,order of operations,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,arithmetic_order_h2,arithmetic,order of operations,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,arithmetic_order_h3,arithmetic,order of operations,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,algebra_equations_e1,algebra,equations,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,algebra_equations_e2,algebra,equations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,algebra_equations_e3,algebra,equations,B,1.0,0.95,B,0.95,B,0.95,B,1.0,B
Open-Reasoner-Zero-7B,algebra_equations_m1,algebra,equations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,algebra_equations_m2,algebra,equations,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,algebra_equations_m3,algebra,equations,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,algebra_equations_h1,algebra,equations,A,0.0,1.0,B,0.85,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,algebra_equations_h2,algebra,equations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,algebra_equations_h3,algebra,equations,A,0.0,0.85,B,0.55,A,0.65,B,0.7,B
Open-Reasoner-Zero-7B,algebra_inequalities_e1,algebra,inequalities,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,algebra_inequalities_e2,algebra,inequalities,A,1.0,0.95,A,0.9,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,algebra_inequalities_e3,algebra,inequalities,A,1.0,0.85,B,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,algebra_inequalities_m1,algebra,inequalities,A,1.0,0.95,A,0.8,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,algebra_inequalities_m2,algebra,inequalities,A,1.0,0.95,B,0.7,A,0.98,A,0.95,A
Open-Reasoner-Zero-7B,algebra_inequalities_m3,algebra,inequalities,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,algebra_inequalities_h1,algebra,inequalities,A,1.0,1.0,B,0.85,A,0.95,A,0.85,B
Open-Reasoner-Zero-7B,algebra_inequalities_h2,algebra,inequalities,B,0.0,0.95,A,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,algebra_inequalities_h3,algebra,inequalities,A,1.0,0.95,A,0.7,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,algebra_polynomials_e1,algebra,polynomials,A,0.0,0.85,B,0.6,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,algebra_polynomials_e2,algebra,polynomials,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,algebra_polynomials_e3,algebra,polynomials,A,0.0,0.95,B,0.6,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,algebra_polynomials_m1,algebra,polynomials,A,1.0,0.95,A,0.75,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,algebra_polynomials_m2,algebra,polynomials,A,1.0,0.95,A,0.8,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,algebra_polynomials_m3,algebra,polynomials,A,0.0,0.9,B,0.95,B,0.98,B,1.0,A
Open-Reasoner-Zero-7B,algebra_polynomials_h1,algebra,polynomials,A,1.0,0.95,A,0.85,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,algebra_polynomials_h2,algebra,polynomials,A,1.0,1.0,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,algebra_polynomials_h3,algebra,polynomials,A,0.0,0.0,B,0.85,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,algebra_functions_e1,algebra,functions,A,1.0,0.95,A,0.95,A,0.95,A,0.9,A
Open-Reasoner-Zero-7B,algebra_functions_e2,algebra,functions,A,0.0,1.0,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,algebra_functions_e3,algebra,functions,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
Open-Reasoner-Zero-7B,algebra_functions_m1,algebra,functions,B,0.0,0.95,B,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,algebra_functions_m2,algebra,functions,A,0.0,0.95,B,0.9,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,algebra_functions_m3,algebra,functions,A,0.0,0.95,B,0.95,A,0.98,B,0.95,A
Open-Reasoner-Zero-7B,algebra_functions_h1,algebra,functions,A,1.0,1.0,B,0.6,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,algebra_functions_h2,algebra,functions,A,1.0,0.95,A,0.55,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,algebra_functions_h3,algebra,functions,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,algebra_systems_e1,algebra,systems of equations,A,1.0,0.95,A,0.9,A,0.95,A,1.0,B
Open-Reasoner-Zero-7B,algebra_systems_e2,algebra,systems of equations,A,1.0,1.0,A,0.85,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,algebra_systems_e3,algebra,systems of equations,A,1.0,0.95,A,0.85,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,algebra_systems_m1,algebra,systems of equations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,algebra_systems_m2,algebra,systems of equations,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,algebra_systems_m3,algebra,systems of equations,A,1.0,0.95,A,1.0,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,algebra_systems_h1,algebra,systems of equations,A,1.0,0.95,A,0.85,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,algebra_systems_h2,algebra,systems of equations,A,0.0,0.95,B,0.85,A,0.99,B,0.95,A
Open-Reasoner-Zero-7B,algebra_systems_h3,algebra,systems of equations,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,calculus_differentiation_e1,calculus,differentiation,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,calculus_differentiation_e2,calculus,differentiation,A,0.0,0.85,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,calculus_differentiation_e3,calculus,differentiation,A,1.0,0.95,B,0.75,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,calculus_differentiation_m1,calculus,differentiation,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,calculus_differentiation_m2,calculus,differentiation,A,1.0,0.95,A,0.85,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,calculus_differentiation_m3,calculus,differentiation,A,0.0,0.85,A,0.9,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,calculus_differentiation_h1,calculus,differentiation,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,calculus_differentiation_h2,calculus,differentiation,A,0.0,1.0,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,calculus_differentiation_h3,calculus,differentiation,A,1.0,0.95,A,0.85,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,calculus_integration_e1,calculus,integration,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,calculus_integration_e2,calculus,integration,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,calculus_integration_e3,calculus,integration,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,calculus_integration_m1,calculus,integration,A,0.0,1.0,B,0.95,A,0.98,B,0.95,A
Open-Reasoner-Zero-7B,calculus_integration_m2,calculus,integration,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,calculus_integration_m3,calculus,integration,A,1.0,1.0,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,calculus_integration_h1,calculus,integration,A,1.0,1.0,A,0.55,A,1.0,A,0.95,B
Open-Reasoner-Zero-7B,calculus_integration_h2,calculus,integration,A,0.0,1.0,B,0.95,B,0.98,B,0.95,A
Open-Reasoner-Zero-7B,calculus_integration_h3,calculus,integration,A,1.0,0.95,B,0.85,A,0.95,A,1.0,A
Open-Reasoner-Zero-7B,calculus_limits_e1,calculus,limits,A,1.0,0.95,A,0.95,A,0.95,A,0.9,A
Open-Reasoner-Zero-7B,calculus_limits_e2,calculus,limits,A,1.0,0.95,A,0.85,A,0.98,A,0.9,A
Open-Reasoner-Zero-7B,calculus_limits_e3,calculus,limits,A,1.0,0.95,B,0.9,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,calculus_limits_m1,calculus,limits,A,0.0,0.95,B,0.8,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,calculus_limits_m2,calculus,limits,A,1.0,0.95,A,0.75,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,calculus_limits_m3,calculus,limits,A,1.0,1.0,A,0.9,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,calculus_limits_h1,calculus,limits,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,calculus_limits_h2,calculus,limits,A,0.0,1.0,B,0.95,B,0.98,B,0.95,A
Open-Reasoner-Zero-7B,calculus_limits_h3,calculus,limits,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,calculus_series_e1,calculus,series,A,1.0,0.95,A,0.85,A,0.98,B,0.95,B
Open-Reasoner-Zero-7B,calculus_series_e2,calculus,series,B,0.0,0.95,A,0.75,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,calculus_series_e3,calculus,series,A,0.0,0.95,B,0.9,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,calculus_series_m1,calculus,series,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,calculus_series_m2,calculus,series,A,1.0,0.95,A,0.8,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,calculus_series_m3,calculus,series,A,1.0,1.0,A,0.55,A,0.98,A,0.95,A
Open-Reasoner-Zero-7B,calculus_series_h1,calculus,series,A,1.0,0.95,B,0.9,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,calculus_series_h2,calculus,series,A,0.0,0.9,B,0.9,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,calculus_series_h3,calculus,series,A,0.0,0.95,B,0.95,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,calculus_applications_e1,calculus,applications,A,1.0,0.9,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,calculus_applications_e2,calculus,applications,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,calculus_applications_e3,calculus,applications,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,calculus_applications_m1,calculus,applications,A,0.0,0.95,B,0.9,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,calculus_applications_m2,calculus,applications,A,0.0,0.95,B,0.65,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,calculus_applications_m3,calculus,applications,A,1.0,0.95,B,0.9,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,calculus_applications_h1,calculus,applications,A,0.0,1.0,B,0.95,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,calculus_applications_h2,calculus,applications,B,0.0,0.95,B,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,calculus_applications_h3,calculus,applications,A,1.0,0.95,A,0.95,A,0.95,A,0.8,A
Open-Reasoner-Zero-7B,geometry_plane_e1,geometry,plane geometry,A,0.0,0.95,B,0.95,B,0.95,B,0.9,B
Open-Reasoner-Zero-7B,geometry_plane_e2,geometry,plane geometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,geometry_plane_e3,geometry,plane geometry,A,0.0,1.0,B,0.85,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,geometry_plane_m1,geometry,plane geometry,A,1.0,0.95,A,0.85,A,0.98,B,0.95,B
Open-Reasoner-Zero-7B,geometry_plane_m2,geometry,plane geometry,A,0.0,1.0,B,0.85,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,geometry_plane_m3,geometry,plane geometry,A,0.0,0.95,B,0.95,A,0.95,B,1.0,A
Open-Reasoner-Zero-7B,geometry_plane_h1,geometry,plane geometry,A,1.0,0.95,B,0.9,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,geometry_plane_h2,geometry,plane geometry,A,1.0,1.0,A,0.7,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,geometry_plane_h3,geometry,plane geometry,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,geometry_coordinate_e1,geometry,coordinate geometry,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,geometry_coordinate_e2,geometry,coordinate geometry,A,1.0,0.95,A,0.85,A,0.95,A,1.0,B
Open-Reasoner-Zero-7B,geometry_coordinate_e3,geometry,coordinate geometry,A,1.0,1.0,B,0.75,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,geometry_coordinate_m1,geometry,coordinate geometry,A,1.0,0.95,A,0.95,A,0.95,A,1.0,B
Open-Reasoner-Zero-7B,geometry_coordinate_m2,geometry,coordinate geometry,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,geometry_coordinate_m3,geometry,coordinate geometry,A,1.0,1.0,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,geometry_coordinate_h1,geometry,coordinate geometry,A,1.0,0.95,B,0.6,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,geometry_coordinate_h2,geometry,coordinate geometry,A,0.0,0.95,B,0.9,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,geometry_coordinate_h3,geometry,coordinate geometry,A,1.0,1.0,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,geometry_transformations_e1,geometry,transformations,B,0.0,0.95,A,0.75,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,geometry_transformations_e2,geometry,transformations,A,1.0,0.95,A,0.8,A,0.98,A,0.95,A
Open-Reasoner-Zero-7B,geometry_transformations_e3,geometry,transformations,A,1.0,0.95,A,0.9,A,0.98,A,1.0,B
Open-Reasoner-Zero-7B,geometry_transformations_m1,geometry,transformations,B,0.0,0.95,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,geometry_transformations_m2,geometry,transformations,B,0.0,0.9,A,0.75,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,geometry_transformations_m3,geometry,transformations,B,0.0,0.95,A,0.7,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,geometry_transformations_h1,geometry,transformations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,geometry_transformations_h2,geometry,transformations,A,1.0,0.95,A,1.0,A,0.98,A,0.95,A
Open-Reasoner-Zero-7B,geometry_transformations_h3,geometry,transformations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,geometry_mensuration_e1,geometry,mensuration,A,0.0,0.95,B,0.95,A,0.95,B,0.9,A
Open-Reasoner-Zero-7B,geometry_mensuration_e2,geometry,mensuration,A,0.0,0.95,A,0.85,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,geometry_mensuration_e3,geometry,mensuration,A,0.0,0.95,B,0.85,A,0.98,B,0.95,B
Open-Reasoner-Zero-7B,geometry_mensuration_m1,geometry,mensuration,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,geometry_mensuration_m2,geometry,mensuration,A,1.0,1.0,A,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,geometry_mensuration_m3,geometry,mensuration,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,geometry_mensuration_h1,geometry,mensuration,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,geometry_mensuration_h2,geometry,mensuration,B,0.0,0.7,B,0.85,A,0.7,A,0.7,A
Open-Reasoner-Zero-7B,geometry_mensuration_h3,geometry,mensuration,A,0.0,0.85,B,0.6,A,0.6,B,0.6,A
Open-Reasoner-Zero-7B,geometry_trigonometry_e1,geometry,trigonometry,A,0.0,0.85,B,0.85,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,geometry_trigonometry_e2,geometry,trigonometry,A,1.0,0.95,A,0.85,B,0.95,A,0.95,B
Open-Reasoner-Zero-7B,geometry_trigonometry_e3,geometry,trigonometry,A,0.0,0.95,A,0.85,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,geometry_trigonometry_m1,geometry,trigonometry,B,0.0,0.95,A,0.85,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,geometry_trigonometry_m2,geometry,trigonometry,A,1.0,0.9,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,geometry_trigonometry_m3,geometry,trigonometry,A,1.0,1.0,A,0.9,A,0.95,A,1.0,A
Open-Reasoner-Zero-7B,geometry_trigonometry_h1,geometry,trigonometry,A,1.0,0.95,A,0.55,A,0.98,A,0.95,A
Open-Reasoner-Zero-7B,geometry_trigonometry_h2,geometry,trigonometry,B,0.0,0.8,A,0.65,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,geometry_trigonometry_h3,geometry,trigonometry,A,1.0,1.0,B,0.85,A,0.9,A,0.8,A
Open-Reasoner-Zero-7B,numbertheory_divisibility_e1,number theory,divisibility,A,0.0,0.95,B,0.95,A,0.95,B,0.9,A
Open-Reasoner-Zero-7B,numbertheory_divisibility_e2,number theory,divisibility,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,numbertheory_divisibility_e3,number theory,divisibility,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,numbertheory_divisibility_m1,number theory,divisibility,A,0.0,0.95,B,0.95,B,0.98,B,0.95,A
Open-Reasoner-Zero-7B,numbertheory_divisibility_m2,number theory,divisibility,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,numbertheory_divisibility_m3,number theory,divisibility,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,numbertheory_divisibility_h1,number theory,divisibility,A,1.0,0.95,A,0.95,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,numbertheory_divisibility_h2,number theory,divisibility,B,1.0,0.95,B,0.9,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,numbertheory_divisibility_h3,number theory,divisibility,A,1.0,1.0,B,0.6,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,numbertheory_modular_e1,number theory,modular arithmetic,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,numbertheory_modular_e2,number theory,modular arithmetic,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,numbertheory_modular_e3,number theory,modular arithmetic,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,numbertheory_modular_m1,number theory,modular arithmetic,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,numbertheory_modular_m2,number theory,modular arithmetic,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,numbertheory_modular_m3,number theory,modular arithmetic,A,1.0,0.95,A,0.7,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,numbertheory_modular_h1,number theory,modular arithmetic,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,numbertheory_modular_h2,number theory,modular arithmetic,A,1.0,1.0,A,0.9,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,numbertheory_modular_h3,number theory,modular arithmetic,A,1.0,0.95,A,0.9,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,numbertheory_primes_e1,number theory,primes,B,0.0,0.95,A,0.85,A,0.95,B,0.9,B
Open-Reasoner-Zero-7B,numbertheory_primes_e2,number theory,primes,A,0.0,0.95,B,0.95,B,0.95,B,1.0,B
Open-Reasoner-Zero-7B,numbertheory_primes_e3,number theory,primes,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,numbertheory_primes_m1,number theory,primes,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,numbertheory_primes_m2,number theory,primes,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,numbertheory_primes_m3,number theory,primes,A,0.0,0.9,B,0.95,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,numbertheory_primes_h1,number theory,primes,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,numbertheory_primes_h2,number theory,primes,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,numbertheory_primes_h3,number theory,primes,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,numbertheory_diophantine_e1,number theory,diophantine equations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,numbertheory_diophantine_e2,number theory,diophantine equations,A,1.0,0.95,A,0.85,A,0.95,A,1.0,B
Open-Reasoner-Zero-7B,numbertheory_diophantine_e3,number theory,diophantine equations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,numbertheory_diophantine_m1,number theory,diophantine equations,A,1.0,0.95,B,0.55,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,numbertheory_diophantine_m2,number theory,diophantine equations,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,numbertheory_diophantine_m3,number theory,diophantine equations,A,1.0,1.0,A,0.51,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,numbertheory_diophantine_h1,number theory,diophantine equations,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,numbertheory_diophantine_h2,number theory,diophantine equations,A,1.0,0.95,A,1.0,A,0.98,A,1.0,A
Open-Reasoner-Zero-7B,numbertheory_diophantine_h3,number theory,diophantine equations,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,numbertheory_sequences_e1,number theory,number sequences,A,1.0,0.95,A,0.85,A,0.98,B,0.95,B
Open-Reasoner-Zero-7B,numbertheory_sequences_e2,number theory,number sequences,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,numbertheory_sequences_e3,number theory,number sequences,A,1.0,1.0,B,0.9,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,numbertheory_sequences_m1,number theory,number sequences,A,1.0,1.0,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,numbertheory_sequences_m2,number theory,number sequences,A,1.0,0.95,B,0.65,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,numbertheory_sequences_m3,number theory,number sequences,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,numbertheory_sequences_h1,number theory,number sequences,A,0.0,0.95,B,0.8,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,numbertheory_sequences_h2,number theory,number sequences,A,1.0,1.0,A,0.85,A,0.98,A,0.95,A
Open-Reasoner-Zero-7B,numbertheory_sequences_h3,number theory,number sequences,B,1.0,0.95,B,0.95,B,0.98,B,1.0,A
Open-Reasoner-Zero-7B,combinatorics_counting_e1,combinatorics,counting principles,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,combinatorics_counting_e2,combinatorics,counting principles,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,combinatorics_counting_e3,combinatorics,counting principles,A,0.0,0.95,A,0.85,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,combinatorics_counting_m1,combinatorics,counting principles,A,0.0,1.0,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,combinatorics_counting_m2,combinatorics,counting principles,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,combinatorics_counting_m3,combinatorics,counting principles,A,0.0,0.95,B,0.95,B,0.98,B,0.95,A
Open-Reasoner-Zero-7B,combinatorics_counting_h1,combinatorics,counting principles,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,combinatorics_counting_h2,combinatorics,counting principles,A,1.0,1.0,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,combinatorics_counting_h3,combinatorics,counting principles,A,1.0,0.95,A,0.85,A,0.9,,,A
Open-Reasoner-Zero-7B,combinatorics_permutations_e1,combinatorics,permutations,A,0.0,0.9,B,0.95,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,combinatorics_permutations_e2,combinatorics,permutations,A,1.0,0.95,A,0.85,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,combinatorics_permutations_e3,combinatorics,permutations,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,combinatorics_permutations_m1,combinatorics,permutations,A,1.0,1.0,A,0.85,B,0.95,A,0.95,B
Open-Reasoner-Zero-7B,combinatorics_permutations_m2,combinatorics,permutations,A,1.0,1.0,A,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,combinatorics_permutations_m3,combinatorics,permutations,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,combinatorics_permutations_h1,combinatorics,permutations,A,1.0,1.0,A,0.85,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,combinatorics_permutations_h2,combinatorics,permutations,A,0.0,0.95,B,0.95,B,0.98,B,0.95,A
Open-Reasoner-Zero-7B,combinatorics_permutations_h3,combinatorics,permutations,A,1.0,0.95,A,0.95,A,0.85,A,0.7,A
Open-Reasoner-Zero-7B,combinatorics_combinations_e1,combinatorics,combinations,A,0.0,0.95,B,0.95,B,0.98,B,0.95,A
Open-Reasoner-Zero-7B,combinatorics_combinations_e2,combinatorics,combinations,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,combinatorics_combinations_e3,combinatorics,combinations,A,1.0,1.0,A,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,combinatorics_combinations_m1,combinatorics,combinations,A,1.0,1.0,B,0.85,A,0.95,A,1.0,A
Open-Reasoner-Zero-7B,combinatorics_combinations_m2,combinatorics,combinations,A,0.0,1.0,B,0.95,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,combinatorics_combinations_m3,combinatorics,combinations,A,1.0,0.95,B,0.6,A,1.0,A,0.95,B
Open-Reasoner-Zero-7B,combinatorics_combinations_h1,combinatorics,combinations,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,combinatorics_combinations_h2,combinatorics,combinations,A,0.0,0.95,B,0.95,B,0.95,B,1.0,B
Open-Reasoner-Zero-7B,combinatorics_combinations_h3,combinatorics,combinations,A,0.0,1.0,B,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,combinatorics_probability_e1,combinatorics,probability,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,combinatorics_probability_e2,combinatorics,probability,A,1.0,0.95,A,0.9,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,combinatorics_probability_e3,combinatorics,probability,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,combinatorics_probability_m1,combinatorics,probability,A,0.0,1.0,B,0.95,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,combinatorics_probability_m2,combinatorics,probability,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,combinatorics_probability_m3,combinatorics,probability,A,0.0,1.0,B,0.7,A,0.98,B,0.95,B
Open-Reasoner-Zero-7B,combinatorics_probability_h1,combinatorics,probability,A,1.0,0.95,A,1.0,A,0.98,A,1.0,B
Open-Reasoner-Zero-7B,combinatorics_probability_h2,combinatorics,probability,A,0.0,0.95,B,0.9,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,combinatorics_probability_h3,combinatorics,probability,A,1.0,0.95,A,0.9,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,combinatorics_recursion_e1,combinatorics,recursion,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,combinatorics_recursion_e2,combinatorics,recursion,A,1.0,1.0,A,0.85,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,combinatorics_recursion_e3,combinatorics,recursion,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,combinatorics_recursion_m1,combinatorics,recursion,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,combinatorics_recursion_m2,combinatorics,recursion,A,1.0,0.95,B,0.9,A,0.95,A,1.0,A
Open-Reasoner-Zero-7B,combinatorics_recursion_m3,combinatorics,recursion,A,0.0,0.95,A,0.85,B,0.9,,,A
Open-Reasoner-Zero-7B,combinatorics_recursion_h1,combinatorics,recursion,A,1.0,0.95,A,0.6,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,combinatorics_recursion_h2,combinatorics,recursion,A,1.0,0.95,A,0.9,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,combinatorics_recursion_h3,combinatorics,recursion,B,1.0,0.95,B,0.85,B,0.95,,,B
Open-Reasoner-Zero-7B,statistics_descriptive_e1,statistics,descriptive statistics,A,1.0,1.0,B,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,statistics_descriptive_e2,statistics,descriptive statistics,A,1.0,1.0,A,0.9,A,0.98,B,0.95,B
Open-Reasoner-Zero-7B,statistics_descriptive_e3,statistics,descriptive statistics,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,statistics_descriptive_m1,statistics,descriptive statistics,A,0.0,1.0,B,0.85,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,statistics_descriptive_m2,statistics,descriptive statistics,A,0.0,0.95,B,0.9,B,0.95,A,0.95,A
Open-Reasoner-Zero-7B,statistics_descriptive_m3,statistics,descriptive statistics,A,0.0,0.95,B,0.85,B,0.95,,,B
Open-Reasoner-Zero-7B,statistics_descriptive_h1,statistics,descriptive statistics,A,0.0,0.95,B,0.95,A,0.95,B,0.9,A
Open-Reasoner-Zero-7B,statistics_descriptive_h2,statistics,descriptive statistics,A,1.0,0.95,A,0.75,B,0.85,A,0.9,B
Open-Reasoner-Zero-7B,statistics_descriptive_h3,statistics,descriptive statistics,A,1.0,1.0,B,0.75,A,0.95,,,B
Open-Reasoner-Zero-7B,statistics_distributions_e1,statistics,distributions,A,0.0,1.0,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,statistics_distributions_e2,statistics,distributions,B,0.0,0.95,B,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,statistics_distributions_e3,statistics,distributions,A,0.0,0.95,B,0.9,A,0.98,B,0.95,B
Open-Reasoner-Zero-7B,statistics_distributions_m1,statistics,distributions,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,statistics_distributions_m2,statistics,distributions,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,statistics_distributions_m3,statistics,distributions,A,1.0,1.0,A,0.9,A,0.98,A,1.0,B
Open-Reasoner-Zero-7B,statistics_distributions_h1,statistics,distributions,A,0.0,1.0,B,0.55,A,0.98,B,0.95,B
Open-Reasoner-Zero-7B,statistics_distributions_h2,statistics,distributions,A,0.0,0.95,B,0.9,B,0.98,B,1.0,A
Open-Reasoner-Zero-7B,statistics_distributions_h3,statistics,distributions,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,statistics_hypothesis_e1,statistics,hypothesis testing,A,1.0,0.85,A,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,statistics_hypothesis_e2,statistics,hypothesis testing,A,1.0,0.9,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,statistics_hypothesis_e3,statistics,hypothesis testing,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,statistics_hypothesis_m1,statistics,hypothesis testing,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,statistics_hypothesis_m2,statistics,hypothesis testing,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,statistics_hypothesis_m3,statistics,hypothesis testing,A,0.0,0.95,B,0.95,B,0.95,B,0.8,A
Open-Reasoner-Zero-7B,statistics_hypothesis_h1,statistics,hypothesis testing,A,1.0,1.0,A,0.7,A,0.98,A,0.95,A
Open-Reasoner-Zero-7B,statistics_hypothesis_h2,statistics,hypothesis testing,B,1.0,0.95,B,0.85,B,0.95,A,0.95,B
Open-Reasoner-Zero-7B,statistics_hypothesis_h3,statistics,hypothesis testing,A,1.0,0.95,A,0.8,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,statistics_regression_e1,statistics,regression,A,0.0,0.9,B,0.85,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,statistics_regression_e2,statistics,regression,A,0.0,0.9,B,0.95,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,statistics_regression_e3,statistics,regression,A,1.0,0.95,B,0.65,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,statistics_regression_m1,statistics,regression,A,1.0,0.9,A,0.85,A,0.95,A,0.7,A
Open-Reasoner-Zero-7B,statistics_regression_m2,statistics,regression,A,0.0,0.95,A,0.85,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,statistics_regression_m3,statistics,regression,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,statistics_regression_h1,statistics,regression,A,0.0,0.95,B,0.85,A,0.95,B,0.9,A
Open-Reasoner-Zero-7B,statistics_regression_h2,statistics,regression,A,1.0,0.95,A,0.95,A,0.98,B,0.9,B
Open-Reasoner-Zero-7B,statistics_regression_h3,statistics,regression,A,1.0,1.0,B,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,statistics_bayesian_e1,statistics,bayesian inference,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,statistics_bayesian_e2,statistics,bayesian inference,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,statistics_bayesian_e3,statistics,bayesian inference,A,0.0,1.0,B,0.85,A,0.95,B,0.9,A
Open-Reasoner-Zero-7B,statistics_bayesian_m1,statistics,bayesian inference,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,statistics_bayesian_m2,statistics,bayesian inference,A,1.0,1.0,A,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,statistics_bayesian_m3,statistics,bayesian inference,A,0.0,1.0,B,0.95,B,0.98,B,1.0,A
Open-Reasoner-Zero-7B,statistics_bayesian_h1,statistics,bayesian inference,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,statistics_bayesian_h2,statistics,bayesian inference,A,1.0,0.95,A,1.0,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,statistics_bayesian_h3,statistics,bayesian inference,A,1.0,1.0,A,0.95,A,0.99,A,1.0,B
Open-Reasoner-Zero-7B,linearalgebra_matrices_e1,linear algebra,matrices,A,1.0,0.95,A,0.85,B,0.95,A,0.95,B
Open-Reasoner-Zero-7B,linearalgebra_matrices_e2,linear algebra,matrices,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_matrices_e3,linear algebra,matrices,A,1.0,0.95,A,0.9,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,linearalgebra_matrices_m1,linear algebra,matrices,A,0.0,0.95,B,0.95,A,0.98,B,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_matrices_m2,linear algebra,matrices,A,0.0,1.0,B,0.95,A,0.95,B,0.9,A
Open-Reasoner-Zero-7B,linearalgebra_matrices_m3,linear algebra,matrices,A,1.0,0.95,A,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_matrices_h1,linear algebra,matrices,B,1.0,0.95,B,0.95,B,0.95,B,0.8,A
Open-Reasoner-Zero-7B,linearalgebra_matrices_h2,linear algebra,matrices,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_matrices_h3,linear algebra,matrices,A,1.0,0.95,A,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_determinants_e1,linear algebra,determinants,A,0.0,1.0,B,0.85,B,0.95,B,0.95,B
Open-Reasoner-Zero-7B,linearalgebra_determinants_e2,linear algebra,determinants,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_determinants_e3,linear algebra,determinants,A,0.0,1.0,B,0.85,B,0.95,A,0.85,A
Open-Reasoner-Zero-7B,linearalgebra_determinants_m1,linear algebra,determinants,B,1.0,0.95,B,0.85,B,0.95,A,1.0,B
Open-Reasoner-Zero-7B,linearalgebra_determinants_m2,linear algebra,determinants,A,1.0,1.0,B,0.75,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_determinants_m3,linear algebra,determinants,A,1.0,1.0,A,0.65,A,0.98,B,0.95,B
Open-Reasoner-Zero-7B,linearalgebra_determinants_h1,linear algebra,determinants,A,0.0,0.95,B,0.95,A,0.95,B,0.7,A
Open-Reasoner-Zero-7B,linearalgebra_determinants_h2,linear algebra,determinants,A,1.0,0.95,A,0.9,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,linearalgebra_determinants_h3,linear algebra,determinants,A,1.0,1.0,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_vectorspaces_e1,linear algebra,vector spaces,A,1.0,1.0,A,0.85,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,linearalgebra_vectorspaces_e2,linear algebra,vector spaces,A,0.0,0.95,B,0.8,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,linearalgebra_vectorspaces_e3,linear algebra,vector spaces,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,linearalgebra_vectorspaces_m1,linear algebra,vector spaces,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_vectorspaces_m2,linear algebra,vector spaces,A,0.0,0.85,B,0.85,A,0.98,B,0.95,B
Open-Reasoner-Zero-7B,linearalgebra_vectorspaces_m3,linear algebra,vector spaces,A,0.0,0.95,B,0.85,A,0.95,B,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_vectorspaces_h1,linear algebra,vector spaces,A,0.0,0.95,B,0.85,A,0.99,B,1.0,A
Open-Reasoner-Zero-7B,linearalgebra_vectorspaces_h2,linear algebra,vector spaces,A,1.0,0.95,A,0.85,A,0.95,B,0.95,B
Open-Reasoner-Zero-7B,linearalgebra_vectorspaces_h3,linear algebra,vector spaces,B,1.0,0.95,B,0.85,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_eigenvalues_e1,linear algebra,eigenvalues,A,0.0,0.95,B,0.95,A,0.95,B,1.0,A
Open-Reasoner-Zero-7B,linearalgebra_eigenvalues_e2,linear algebra,eigenvalues,A,1.0,0.95,B,0.95,A,0.98,A,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_eigenvalues_e3,linear algebra,eigenvalues,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
Open-Reasoner-Zero-7B,linearalgebra_eigenvalues_m1,linear algebra,eigenvalues,A,1.0,1.0,A,0.6,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_eigenvalues_m2,linear algebra,eigenvalues,A,0.0,0.95,B,0.75,B,0.9,B,0.9,B
Open-Reasoner-Zero-7B,linearalgebra_eigenvalues_m3,linear algebra,eigenvalues,A,1.0,0.95,B,0.9,A,0.95,A,0.85,A
Open-Reasoner-Zero-7B,linearalgebra_eigenvalues_h1,linear algebra,eigenvalues,A,1.0,0.95,A,0.95,A,0.98,,,A
Open-Reasoner-Zero-7B,linearalgebra_eigenvalues_h2,linear algebra,eigenvalues,A,0.0,0.9,B,0.95,B,0.95,B,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_eigenvalues_h3,linear algebra,eigenvalues,A,1.0,0.95,B,0.51,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_transformations_e1,linear algebra,linear transformations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_transformations_e2,linear algebra,linear transformations,A,1.0,0.95,A,0.85,A,0.95,A,1.0,B
Open-Reasoner-Zero-7B,linearalgebra_transformations_e3,linear algebra,linear transformations,A,0.0,1.0,B,0.9,B,0.98,B,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_transformations_m1,linear algebra,linear transformations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
Open-Reasoner-Zero-7B,linearalgebra_transformations_m2,linear algebra,linear transformations,A,1.0,1.0,A,0.8,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,linearalgebra_transformations_m3,linear algebra,linear transformations,A,1.0,0.95,A,0.6,A,0.98,A,0.95,B
Open-Reasoner-Zero-7B,linearalgebra_transformations_h1,linear algebra,linear transformations,A,0.0,1.0,B,0.9,B,0.95,,,B
Open-Reasoner-Zero-7B,linearalgebra_transformations_h2,linear algebra,linear transformations,A,0.0,0.95,B,0.95,B,0.9,B,0.8,B
Open-Reasoner-Zero-7B,linearalgebra_transformations_h3,linear algebra,linear transformations,A,1.0,1.0,B,0.9,A,0.95,A,0.95,A
s1.1-7B,arithmetic_basic_operations_e1,arithmetic,basic operations,A,1.0,0.85,A,0.95,A,0.95,A,0.95,A
s1.1-7B,arithmetic_basic_operations_e2,arithmetic,basic operations,B,1.0,0.95,B,0.95,B,0.92,B,0.95,A
s1.1-7B,arithmetic_basic_operations_e3,arithmetic,basic operations,B,0.0,0.9,A,0.95,A,0.98,A,0.95,B
s1.1-7B,arithmetic_basic_operations_m1,arithmetic,basic operations,B,1.0,0.95,B,0.9,B,0.95,B,0.95,A
s1.1-7B,arithmetic_basic_operations_m2,arithmetic,basic operations,A,1.0,0.95,A,0.85,B,0.92,A,0.95,B
s1.1-7B,arithmetic_basic_operations_m3,arithmetic,basic operations,A,0.0,0.95,B,0.95,B,0.92,B,0.95,A
s1.1-7B,arithmetic_basic_operations_h1,arithmetic,basic operations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
s1.1-7B,arithmetic_basic_operations_h2,arithmetic,basic operations,B,0.0,0.85,A,0.95,A,0.95,A,0.95,A
s1.1-7B,arithmetic_basic_operations_h3,arithmetic,basic operations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,arithmetic_fractions_e1,arithmetic,fractions,B,0.0,0.95,B,0.95,A,0.95,A,0.95,A
s1.1-7B,arithmetic_fractions_e2,arithmetic,fractions,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
s1.1-7B,arithmetic_fractions_e3,arithmetic,fractions,B,0.0,0.85,A,0.95,A,0.95,A,0.95,A
s1.1-7B,arithmetic_fractions_m1,arithmetic,fractions,A,0.0,0.85,B,0.8,B,0.95,A,0.95,B
s1.1-7B,arithmetic_fractions_m2,arithmetic,fractions,A,1.0,0.95,B,0.75,A,0.95,A,0.95,B
s1.1-7B,arithmetic_fractions_m3,arithmetic,fractions,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,arithmetic_fractions_h1,arithmetic,fractions,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,arithmetic_fractions_h2,arithmetic,fractions,A,1.0,0.95,A,0.85,A,0.9,A,0.95,A
s1.1-7B,arithmetic_fractions_h3,arithmetic,fractions,A,0.0,0.95,B,1.0,B,0.95,B,1.0,B
s1.1-7B,arithmetic_percentages_e1,arithmetic,percentages,A,0.0,0.9,B,0.95,B,0.95,B,1.0,A
s1.1-7B,arithmetic_percentages_e2,arithmetic,percentages,B,1.0,0.95,B,0.95,B,0.95,A,0.95,A
s1.1-7B,arithmetic_percentages_e3,arithmetic,percentages,A,1.0,0.95,A,0.95,A,0.95,B,0.95,A
s1.1-7B,arithmetic_percentages_m1,arithmetic,percentages,A,0.0,0.95,B,0.95,B,0.98,B,0.95,B
s1.1-7B,arithmetic_percentages_m2,arithmetic,percentages,A,1.0,0.85,B,0.95,A,0.95,A,0.95,A
s1.1-7B,arithmetic_percentages_m3,arithmetic,percentages,A,1.0,0.95,A,0.9,A,0.95,A,0.95,B
s1.1-7B,arithmetic_percentages_h1,arithmetic,percentages,A,1.0,0.9,A,0.9,B,0.95,A,0.95,A
s1.1-7B,arithmetic_percentages_h2,arithmetic,percentages,A,0.0,0.92,B,0.95,B,0.85,B,1.0,A
s1.1-7B,arithmetic_percentages_h3,arithmetic,percentages,A,1.0,0.95,A,1.0,A,0.95,A,1.0,A
s1.1-7B,arithmetic_numerical_e1,arithmetic,numerical approximation,A,0.0,0.95,B,0.95,B,0.98,A,0.95,B
s1.1-7B,arithmetic_numerical_e2,arithmetic,numerical approximation,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,arithmetic_numerical_e3,arithmetic,numerical approximation,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,arithmetic_numerical_m1,arithmetic,numerical approximation,B,1.0,0.85,A,0.85,B,0.92,B,0.95,B
s1.1-7B,arithmetic_numerical_m2,arithmetic,numerical approximation,B,1.0,0.85,B,0.85,B,0.95,A,0.95,A
s1.1-7B,arithmetic_numerical_m3,arithmetic,numerical approximation,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,arithmetic_numerical_h1,arithmetic,numerical approximation,A,0.0,0.85,B,0.85,B,0.9,A,0.9,A
s1.1-7B,arithmetic_numerical_h2,arithmetic,numerical approximation,A,0.0,0.95,B,0.65,A,0.75,B,0.9,A
s1.1-7B,arithmetic_numerical_h3,arithmetic,numerical approximation,A,0.0,0.95,B,0.9,B,0.95,A,0.95,A
s1.1-7B,arithmetic_order_e1,arithmetic,order of operations,A,1.0,0.95,A,1.0,A,0.95,A,0.95,A
s1.1-7B,arithmetic_order_e2,arithmetic,order of operations,A,1.0,0.95,A,0.9,B,0.95,A,0.95,A
s1.1-7B,arithmetic_order_e3,arithmetic,order of operations,A,0.0,0.85,B,0.95,B,0.98,B,0.95,B
s1.1-7B,arithmetic_order_m1,arithmetic,order of operations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,arithmetic_order_m2,arithmetic,order of operations,A,1.0,0.95,A,0.95,B,0.95,A,0.95,A
s1.1-7B,arithmetic_order_m3,arithmetic,order of operations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,arithmetic_order_h1,arithmetic,order of operations,A,0.0,0.95,B,0.95,B,0.95,B,0.9,B
s1.1-7B,arithmetic_order_h2,arithmetic,order of operations,A,0.0,0.95,B,0.85,B,0.95,A,1.0,B
s1.1-7B,arithmetic_order_h3,arithmetic,order of operations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
s1.1-7B,algebra_equations_e1,algebra,equations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,algebra_equations_e2,algebra,equations,B,1.0,0.95,B,0.95,B,0.95,A,0.95,B
s1.1-7B,algebra_equations_e3,algebra,equations,A,1.0,0.95,A,0.95,A,0.98,A,1.0,B
s1.1-7B,algebra_equations_m1,algebra,equations,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
s1.1-7B,algebra_equations_m2,algebra,equations,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
s1.1-7B,algebra_equations_m3,algebra,equations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,algebra_equations_h1,algebra,equations,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
s1.1-7B,algebra_equations_h2,algebra,equations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
s1.1-7B,algebra_equations_h3,algebra,equations,A,0.0,0.55,B,0.75,B,0.65,A,0.75,A
s1.1-7B,algebra_inequalities_e1,algebra,inequalities,B,1.0,0.95,B,0.95,B,0.98,A,0.95,B
s1.1-7B,algebra_inequalities_e2,algebra,inequalities,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,algebra_inequalities_e3,algebra,inequalities,A,1.0,0.85,A,0.6,A,0.95,A,0.95,A
s1.1-7B,algebra_inequalities_m1,algebra,inequalities,A,1.0,0.85,B,0.9,A,0.95,A,0.95,A
s1.1-7B,algebra_inequalities_m2,algebra,inequalities,A,1.0,0.95,A,0.95,A,0.95,B,0.9,A
s1.1-7B,algebra_inequalities_m3,algebra,inequalities,B,1.0,0.85,B,0.95,B,0.95,B,0.95,A
s1.1-7B,algebra_inequalities_h1,algebra,inequalities,B,1.0,0.95,B,0.85,B,0.95,A,0.95,A
s1.1-7B,algebra_inequalities_h2,algebra,inequalities,B,1.0,0.92,B,0.95,B,0.98,B,0.95,B
s1.1-7B,algebra_inequalities_h3,algebra,inequalities,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
s1.1-7B,algebra_polynomials_e1,algebra,polynomials,B,1.0,0.95,B,0.98,B,0.98,B,0.95,B
s1.1-7B,algebra_polynomials_e2,algebra,polynomials,B,0.0,0.85,A,0.95,A,0.95,B,0.95,A
s1.1-7B,algebra_polynomials_e3,algebra,polynomials,A,0.0,0.95,B,0.65,A,0.95,B,0.9,A
s1.1-7B,algebra_polynomials_m1,algebra,polynomials,B,1.0,0.95,B,0.85,B,0.95,B,0.95,B
s1.1-7B,algebra_polynomials_m2,algebra,polynomials,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,algebra_polynomials_m3,algebra,polynomials,B,1.0,0.95,B,0.95,B,0.95,A,0.95,B
s1.1-7B,algebra_polynomials_h1,algebra,polynomials,A,1.0,0.95,A,0.95,A,0.98,A,0.95,A
s1.1-7B,algebra_polynomials_h2,algebra,polynomials,A,0.0,0.85,B,0.95,B,0.98,B,0.95,B
s1.1-7B,algebra_polynomials_h3,algebra,polynomials,B,1.0,0.75,A,0.75,B,0.9,B,0.95,A
s1.1-7B,algebra_functions_e1,algebra,functions,A,0.0,0.95,B,0.95,B,0.95,A,1.0,B
s1.1-7B,algebra_functions_e2,algebra,functions,B,1.0,0.95,B,0.9,A,0.92,B,0.85,A
s1.1-7B,algebra_functions_e3,algebra,functions,A,1.0,0.95,A,0.95,A,0.95,B,0.95,A
s1.1-7B,algebra_functions_m1,algebra,functions,A,1.0,1.0,A,0.7,B,0.92,A,0.95,A
s1.1-7B,algebra_functions_m2,algebra,functions,B,1.0,0.95,A,0.7,B,0.95,B,1.0,A
s1.1-7B,algebra_functions_m3,algebra,functions,A,0.0,0.95,B,0.85,B,0.95,A,0.95,A
s1.1-7B,algebra_functions_h1,algebra,functions,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,algebra_functions_h2,algebra,functions,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
s1.1-7B,algebra_functions_h3,algebra,functions,A,1.0,0.85,A,0.95,A,0.95,A,0.95,B
s1.1-7B,algebra_systems_e1,algebra,systems of equations,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
s1.1-7B,algebra_systems_e2,algebra,systems of equations,B,1.0,0.95,B,0.95,B,0.95,B,0.9,B
s1.1-7B,algebra_systems_e3,algebra,systems of equations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,algebra_systems_m1,algebra,systems of equations,B,0.0,0.85,A,0.95,A,0.95,A,0.95,B
s1.1-7B,algebra_systems_m2,algebra,systems of equations,A,0.0,0.95,B,1.0,B,0.95,B,0.95,B
s1.1-7B,algebra_systems_m3,algebra,systems of equations,A,0.0,0.95,B,0.9,B,0.95,A,0.95,A
s1.1-7B,algebra_systems_h1,algebra,systems of equations,B,1.0,0.95,B,0.9,B,0.85,B,0.95,A
s1.1-7B,algebra_systems_h2,algebra,systems of equations,A,0.0,0.9,B,0.95,B,0.95,B,0.95,A
s1.1-7B,algebra_systems_h3,algebra,systems of equations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
s1.1-7B,calculus_differentiation_e1,calculus,differentiation,A,0.0,0.95,B,0.92,A,0.95,B,0.95,A
s1.1-7B,calculus_differentiation_e2,calculus,differentiation,B,0.0,0.95,A,0.95,A,0.95,B,0.95,A
s1.1-7B,calculus_differentiation_e3,calculus,differentiation,A,0.0,0.85,B,0.9,B,0.95,B,0.95,B
s1.1-7B,calculus_differentiation_m1,calculus,differentiation,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
s1.1-7B,calculus_differentiation_m2,calculus,differentiation,B,0.0,0.9,A,0.95,A,0.95,A,0.95,A
s1.1-7B,calculus_differentiation_m3,calculus,differentiation,B,1.0,0.85,B,0.99,B,0.95,B,0.95,A
s1.1-7B,calculus_differentiation_h1,calculus,differentiation,B,1.0,0.95,B,1.0,B,0.95,B,0.95,B
s1.1-7B,calculus_differentiation_h2,calculus,differentiation,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
s1.1-7B,calculus_differentiation_h3,calculus,differentiation,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
s1.1-7B,calculus_integration_e1,calculus,integration,B,1.0,0.95,B,0.95,B,0.95,A,0.95,A
s1.1-7B,calculus_integration_e2,calculus,integration,A,1.0,0.95,A,0.98,A,0.95,A,0.95,A
s1.1-7B,calculus_integration_e3,calculus,integration,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,calculus_integration_m1,calculus,integration,A,0.0,0.95,B,0.85,A,0.95,B,0.95,B
s1.1-7B,calculus_integration_m2,calculus,integration,A,1.0,0.95,A,0.95,A,0.98,A,0.95,B
s1.1-7B,calculus_integration_m3,calculus,integration,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,calculus_integration_h1,calculus,integration,B,1.0,0.9,B,0.98,B,0.98,B,1.0,A
s1.1-7B,calculus_integration_h2,calculus,integration,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
s1.1-7B,calculus_integration_h3,calculus,integration,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
s1.1-7B,calculus_limits_e1,calculus,limits,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
s1.1-7B,calculus_limits_e2,calculus,limits,A,1.0,0.95,B,0.85,A,0.98,A,0.95,B
s1.1-7B,calculus_limits_e3,calculus,limits,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
s1.1-7B,calculus_limits_m1,calculus,limits,A,0.0,0.95,B,0.85,B,0.95,A,0.95,A
s1.1-7B,calculus_limits_m2,calculus,limits,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,calculus_limits_m3,calculus,limits,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,calculus_limits_h1,calculus,limits,A,1.0,0.95,A,1.0,A,0.95,A,1.0,B
s1.1-7B,calculus_limits_h2,calculus,limits,A,0.0,0.95,B,0.85,A,0.98,B,0.95,B
s1.1-7B,calculus_limits_h3,calculus,limits,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,calculus_series_e1,calculus,series,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
s1.1-7B,calculus_series_e2,calculus,series,A,1.0,0.95,B,0.9,A,0.92,A,0.95,B
s1.1-7B,calculus_series_e3,calculus,series,B,0.0,0.85,A,0.85,A,0.95,A,0.95,A
s1.1-7B,calculus_series_m1,calculus,series,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
s1.1-7B,calculus_series_m2,calculus,series,A,1.0,0.95,A,0.95,A,0.98,A,0.95,A
s1.1-7B,calculus_series_m3,calculus,series,B,1.0,0.9,B,0.95,B,0.95,B,0.95,B
s1.1-7B,calculus_series_h1,calculus,series,A,1.0,1.0,A,0.95,B,0.95,A,0.95,B
s1.1-7B,calculus_series_h2,calculus,series,A,0.0,0.92,B,0.95,B,0.95,B,0.95,A
s1.1-7B,calculus_series_h3,calculus,series,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
s1.1-7B,calculus_applications_e1,calculus,applications,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
s1.1-7B,calculus_applications_e2,calculus,applications,B,0.0,0.98,B,0.85,A,0.95,A,0.95,A
s1.1-7B,calculus_applications_e3,calculus,applications,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,calculus_applications_m1,calculus,applications,A,1.0,0.85,A,0.9,A,0.95,A,0.95,A
s1.1-7B,calculus_applications_m2,calculus,applications,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,calculus_applications_m3,calculus,applications,A,1.0,0.8,A,0.9,A,0.95,A,0.95,A
s1.1-7B,calculus_applications_h1,calculus,applications,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,calculus_applications_h2,calculus,applications,A,0.0,0.95,B,0.75,B,0.95,B,0.95,B
s1.1-7B,calculus_applications_h3,calculus,applications,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
s1.1-7B,geometry_plane_e1,geometry,plane geometry,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
s1.1-7B,geometry_plane_e2,geometry,plane geometry,A,1.0,0.95,A,1.0,A,0.95,A,0.95,A
s1.1-7B,geometry_plane_e3,geometry,plane geometry,A,0.0,0.85,B,0.95,B,0.95,A,0.95,B
s1.1-7B,geometry_plane_m1,geometry,plane geometry,A,0.0,0.95,B,0.98,B,0.98,B,0.95,B
s1.1-7B,geometry_plane_m2,geometry,plane geometry,B,1.0,0.85,B,0.95,B,0.95,B,1.0,B
s1.1-7B,geometry_plane_m3,geometry,plane geometry,A,0.0,0.95,B,1.0,B,0.98,B,0.95,B
s1.1-7B,geometry_plane_h1,geometry,plane geometry,B,1.0,0.95,B,0.85,B,0.95,A,0.95,A
s1.1-7B,geometry_plane_h2,geometry,plane geometry,B,1.0,0.95,B,0.98,B,0.98,B,0.95,B
s1.1-7B,geometry_plane_h3,geometry,plane geometry,B,1.0,0.95,B,0.95,B,0.98,B,0.95,B
s1.1-7B,geometry_coordinate_e1,geometry,coordinate geometry,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,geometry_coordinate_e2,geometry,coordinate geometry,B,0.0,1.0,A,0.95,A,0.95,B,0.95,A
s1.1-7B,geometry_coordinate_e3,geometry,coordinate geometry,A,1.0,0.95,A,0.95,B,0.92,A,0.95,B
s1.1-7B,geometry_coordinate_m1,geometry,coordinate geometry,A,1.0,0.95,B,0.95,A,0.92,A,0.95,A
s1.1-7B,geometry_coordinate_m2,geometry,coordinate geometry,B,1.0,0.95,B,1.0,B,0.95,B,0.95,B
s1.1-7B,geometry_coordinate_m3,geometry,coordinate geometry,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
s1.1-7B,geometry_coordinate_h1,geometry,coordinate geometry,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,geometry_coordinate_h2,geometry,coordinate geometry,A,0.0,0.95,B,0.9,B,0.95,A,0.95,B
s1.1-7B,geometry_coordinate_h3,geometry,coordinate geometry,B,1.0,0.95,B,1.0,B,0.98,B,0.95,B
s1.1-7B,geometry_transformations_e1,geometry,transformations,A,1.0,0.9,A,0.9,A,0.92,A,0.95,A
s1.1-7B,geometry_transformations_e2,geometry,transformations,A,0.0,0.95,B,0.85,B,0.92,B,0.95,B
s1.1-7B,geometry_transformations_e3,geometry,transformations,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
s1.1-7B,geometry_transformations_m1,geometry,transformations,A,0.0,0.85,A,0.95,B,0.85,B,0.95,A
s1.1-7B,geometry_transformations_m2,geometry,transformations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
s1.1-7B,geometry_transformations_m3,geometry,transformations,B,1.0,0.95,B,0.95,B,0.92,B,0.95,B
s1.1-7B,geometry_transformations_h1,geometry,transformations,B,0.0,0.95,A,0.85,B,0.95,A,0.95,A
s1.1-7B,geometry_transformations_h2,geometry,transformations,A,1.0,0.95,A,0.95,A,0.85,A,0.9,B
s1.1-7B,geometry_transformations_h3,geometry,transformations,B,1.0,0.95,B,0.6,B,0.75,B,0.8,B
s1.1-7B,geometry_mensuration_e1,geometry,mensuration,B,1.0,0.95,B,1.0,B,0.98,B,0.95,B
s1.1-7B,geometry_mensuration_e2,geometry,mensuration,B,0.0,0.95,A,0.85,A,0.98,A,0.95,A
s1.1-7B,geometry_mensuration_e3,geometry,mensuration,B,0.0,0.95,A,0.85,B,0.92,A,0.95,A
s1.1-7B,geometry_mensuration_m1,geometry,mensuration,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,geometry_mensuration_m2,geometry,mensuration,B,1.0,0.85,B,1.0,B,0.98,B,0.95,B
s1.1-7B,geometry_mensuration_m3,geometry,mensuration,B,0.0,0.95,A,0.95,A,0.92,A,0.95,A
s1.1-7B,geometry_mensuration_h1,geometry,mensuration,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
s1.1-7B,geometry_mensuration_h2,geometry,mensuration,B,1.0,0.85,B,0.65,B,0.85,B,0.75,B
s1.1-7B,geometry_mensuration_h3,geometry,mensuration,A,0.0,0.75,B,0.85,B,0.85,A,0.9,B
s1.1-7B,geometry_trigonometry_e1,geometry,trigonometry,A,1.0,0.95,A,0.95,A,0.9,A,0.95,A
s1.1-7B,geometry_trigonometry_e2,geometry,trigonometry,A,1.0,0.95,A,0.85,A,0.9,A,0.95,A
s1.1-7B,geometry_trigonometry_e3,geometry,trigonometry,A,1.0,0.95,A,0.98,A,0.95,A,0.95,A
s1.1-7B,geometry_trigonometry_m1,geometry,trigonometry,A,0.0,0.85,B,1.0,B,0.95,B,1.0,A
s1.1-7B,geometry_trigonometry_m2,geometry,trigonometry,B,0.0,0.95,A,1.0,A,0.95,A,0.95,A
s1.1-7B,geometry_trigonometry_m3,geometry,trigonometry,A,1.0,0.95,A,0.9,A,0.92,A,0.95,A
s1.1-7B,geometry_trigonometry_h1,geometry,trigonometry,A,0.0,0.95,A,0.85,B,0.95,B,0.95,A
s1.1-7B,geometry_trigonometry_h2,geometry,trigonometry,A,0.0,0.85,B,0.95,B,0.95,B,0.95,A
s1.1-7B,geometry_trigonometry_h3,geometry,trigonometry,A,0.0,0.95,B,0.95,B,0.95,,,B
s1.1-7B,numbertheory_divisibility_e1,number theory,divisibility,A,1.0,0.9,A,0.95,A,0.95,B,0.95,A
s1.1-7B,numbertheory_divisibility_e2,number theory,divisibility,A,0.0,0.9,B,0.85,B,0.95,A,0.95,A
s1.1-7B,numbertheory_divisibility_e3,number theory,divisibility,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
s1.1-7B,numbertheory_divisibility_m1,number theory,divisibility,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,numbertheory_divisibility_m2,number theory,divisibility,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,numbertheory_divisibility_m3,number theory,divisibility,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,numbertheory_divisibility_h1,number theory,divisibility,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
s1.1-7B,numbertheory_divisibility_h2,number theory,divisibility,B,0.0,0.92,A,0.85,A,0.95,A,0.95,B
s1.1-7B,numbertheory_divisibility_h3,number theory,divisibility,A,0.0,0.85,B,0.98,B,0.98,B,1.0,B
s1.1-7B,numbertheory_modular_e1,number theory,modular arithmetic,A,1.0,0.85,A,0.98,A,0.95,A,0.95,A
s1.1-7B,numbertheory_modular_e2,number theory,modular arithmetic,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,numbertheory_modular_e3,number theory,modular arithmetic,A,0.0,0.9,B,0.85,B,0.95,A,0.95,A
s1.1-7B,numbertheory_modular_m1,number theory,modular arithmetic,A,0.0,0.95,B,0.95,B,0.95,A,0.9,A
s1.1-7B,numbertheory_modular_m2,number theory,modular arithmetic,A,1.0,0.95,A,0.95,A,0.95,A,1.0,B
s1.1-7B,numbertheory_modular_m3,number theory,modular arithmetic,A,1.0,0.95,A,0.95,A,0.98,A,0.95,B
s1.1-7B,numbertheory_modular_h1,number theory,modular arithmetic,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,numbertheory_modular_h2,number theory,modular arithmetic,A,0.0,0.95,B,0.95,B,0.85,B,0.95,B
s1.1-7B,numbertheory_modular_h3,number theory,modular arithmetic,A,0.0,0.85,B,0.9,B,0.95,A,0.95,B
s1.1-7B,numbertheory_primes_e1,number theory,primes,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
s1.1-7B,numbertheory_primes_e2,number theory,primes,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
s1.1-7B,numbertheory_primes_e3,number theory,primes,B,0.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,numbertheory_primes_m1,number theory,primes,B,0.0,0.85,B,0.75,A,0.9,A,0.9,A
s1.1-7B,numbertheory_primes_m2,number theory,primes,A,1.0,0.95,A,1.0,A,0.98,A,0.95,A
s1.1-7B,numbertheory_primes_m3,number theory,primes,A,1.0,0.85,A,0.98,A,0.95,A,0.95,A
s1.1-7B,numbertheory_primes_h1,number theory,primes,A,1.0,0.85,A,0.95,A,0.95,A,0.95,A
s1.1-7B,numbertheory_primes_h2,number theory,primes,A,1.0,0.95,B,0.95,A,0.95,A,0.95,B
s1.1-7B,numbertheory_primes_h3,number theory,primes,A,0.0,0.95,B,0.9,B,0.95,A,0.95,B
s1.1-7B,numbertheory_diophantine_e1,number theory,diophantine equations,A,1.0,0.95,B,0.95,A,0.98,A,0.95,B
s1.1-7B,numbertheory_diophantine_e2,number theory,diophantine equations,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
s1.1-7B,numbertheory_diophantine_e3,number theory,diophantine equations,A,1.0,0.85,A,0.85,A,0.95,A,0.95,B
s1.1-7B,numbertheory_diophantine_m1,number theory,diophantine equations,B,0.0,0.85,A,0.9,A,0.95,A,0.95,A
s1.1-7B,numbertheory_diophantine_m2,number theory,diophantine equations,A,1.0,0.95,B,0.85,A,0.95,A,0.95,B
s1.1-7B,numbertheory_diophantine_m3,number theory,diophantine equations,A,1.0,0.95,B,0.95,A,0.95,A,0.95,A
s1.1-7B,numbertheory_diophantine_h1,number theory,diophantine equations,B,1.0,0.9,B,0.95,B,0.98,B,0.95,A
s1.1-7B,numbertheory_diophantine_h2,number theory,diophantine equations,B,0.0,0.95,A,0.75,A,0.92,B,0.95,B
s1.1-7B,numbertheory_diophantine_h3,number theory,diophantine equations,A,0.0,0.65,B,0.8,B,0.65,B,0.85,B
s1.1-7B,numbertheory_sequences_e1,number theory,number sequences,B,0.0,0.85,B,0.95,A,0.95,A,0.95,A
s1.1-7B,numbertheory_sequences_e2,number theory,number sequences,A,1.0,0.95,A,0.95,A,0.95,B,0.9,A
s1.1-7B,numbertheory_sequences_e3,number theory,number sequences,B,1.0,0.95,B,1.0,B,0.95,B,0.95,B
s1.1-7B,numbertheory_sequences_m1,number theory,number sequences,A,0.0,0.95,B,0.85,B,0.95,A,0.95,B
s1.1-7B,numbertheory_sequences_m2,number theory,number sequences,A,0.0,0.95,B,0.9,B,0.95,B,0.95,B
s1.1-7B,numbertheory_sequences_m3,number theory,number sequences,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,numbertheory_sequences_h1,number theory,number sequences,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
s1.1-7B,numbertheory_sequences_h2,number theory,number sequences,A,1.0,0.95,B,0.9,A,0.95,A,0.95,A
s1.1-7B,numbertheory_sequences_h3,number theory,number sequences,A,1.0,0.85,A,0.98,A,0.95,A,0.95,A
s1.1-7B,combinatorics_counting_e1,combinatorics,counting principles,A,0.0,0.9,B,0.85,B,0.95,B,0.95,A
s1.1-7B,combinatorics_counting_e2,combinatorics,counting principles,A,0.0,0.95,B,0.95,B,0.95,B,0.9,B
s1.1-7B,combinatorics_counting_e3,combinatorics,counting principles,A,1.0,0.95,A,0.85,A,0.92,A,0.95,A
s1.1-7B,combinatorics_counting_m1,combinatorics,counting principles,B,0.0,0.85,A,0.95,A,0.95,A,0.95,A
s1.1-7B,combinatorics_counting_m2,combinatorics,counting principles,A,1.0,0.9,A,0.85,B,0.95,A,0.95,A
s1.1-7B,combinatorics_counting_m3,combinatorics,counting principles,B,1.0,0.95,B,0.95,B,0.98,B,0.95,B
s1.1-7B,combinatorics_counting_h1,combinatorics,counting principles,B,1.0,0.9,B,0.99,B,0.95,B,0.95,A
s1.1-7B,combinatorics_counting_h2,combinatorics,counting principles,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
s1.1-7B,combinatorics_counting_h3,combinatorics,counting principles,B,1.0,0.95,B,0.98,B,0.95,B,1.0,B
s1.1-7B,combinatorics_permutations_e1,combinatorics,permutations,A,0.0,0.95,A,0.85,B,0.95,B,0.95,B
s1.1-7B,combinatorics_permutations_e2,combinatorics,permutations,A,1.0,0.95,A,0.95,A,0.98,A,0.95,A
s1.1-7B,combinatorics_permutations_e3,combinatorics,permutations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,combinatorics_permutations_m1,combinatorics,permutations,A,0.0,0.95,B,0.9,A,0.95,B,0.95,A
s1.1-7B,combinatorics_permutations_m2,combinatorics,permutations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,combinatorics_permutations_m3,combinatorics,permutations,A,1.0,0.95,A,0.85,A,0.95,A,1.0,A
s1.1-7B,combinatorics_permutations_h1,combinatorics,permutations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,combinatorics_permutations_h2,combinatorics,permutations,A,1.0,0.95,B,0.9,A,0.98,A,0.95,B
s1.1-7B,combinatorics_permutations_h3,combinatorics,permutations,B,1.0,0.85,B,0.85,A,0.85,B,0.6,A
s1.1-7B,combinatorics_combinations_e1,combinatorics,combinations,A,0.0,0.95,B,0.98,B,0.95,A,0.9,B
s1.1-7B,combinatorics_combinations_e2,combinatorics,combinations,B,1.0,0.95,B,0.9,B,0.98,B,0.95,A
s1.1-7B,combinatorics_combinations_e3,combinatorics,combinations,A,1.0,0.95,A,0.85,A,0.95,B,0.9,B
s1.1-7B,combinatorics_combinations_m1,combinatorics,combinations,A,1.0,0.95,A,0.85,A,0.95,A,0.95,A
s1.1-7B,combinatorics_combinations_m2,combinatorics,combinations,B,0.0,0.85,A,0.95,A,0.95,A,0.95,B
s1.1-7B,combinatorics_combinations_m3,combinatorics,combinations,A,1.0,0.95,A,0.98,A,0.98,A,0.95,A
s1.1-7B,combinatorics_combinations_h1,combinatorics,combinations,A,1.0,0.95,A,0.95,A,0.95,A,1.0,A
s1.1-7B,combinatorics_combinations_h2,combinatorics,combinations,B,1.0,0.95,B,1.0,B,0.98,B,1.0,B
s1.1-7B,combinatorics_combinations_h3,combinatorics,combinations,B,1.0,0.85,B,0.85,B,0.95,B,0.95,B
s1.1-7B,combinatorics_probability_e1,combinatorics,probability,A,1.0,0.95,A,0.95,A,0.98,A,0.95,A
s1.1-7B,combinatorics_probability_e2,combinatorics,probability,A,0.0,0.85,B,0.95,B,0.95,B,0.95,B
s1.1-7B,combinatorics_probability_e3,combinatorics,probability,A,1.0,0.95,A,0.85,B,0.92,A,0.95,A
s1.1-7B,combinatorics_probability_m1,combinatorics,probability,A,1.0,0.95,A,0.98,A,0.95,A,0.95,A
s1.1-7B,combinatorics_probability_m2,combinatorics,probability,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,combinatorics_probability_m3,combinatorics,probability,A,1.0,0.95,A,1.0,A,0.95,A,1.0,A
s1.1-7B,combinatorics_probability_h1,combinatorics,probability,A,0.0,0.95,B,0.98,A,0.95,,,A
s1.1-7B,combinatorics_probability_h2,combinatorics,probability,A,0.0,0.95,B,0.85,B,0.95,B,0.95,B
s1.1-7B,combinatorics_probability_h3,combinatorics,probability,A,0.0,0.95,B,0.9,B,0.95,A,0.95,B
s1.1-7B,combinatorics_recursion_e1,combinatorics,recursion,A,1.0,0.95,A,0.95,A,0.98,B,0.9,A
s1.1-7B,combinatorics_recursion_e2,combinatorics,recursion,B,1.0,0.9,B,0.95,B,0.98,B,0.95,B
s1.1-7B,combinatorics_recursion_e3,combinatorics,recursion,A,1.0,0.85,A,0.95,A,1.0,A,0.95,B
s1.1-7B,combinatorics_recursion_m1,combinatorics,recursion,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,combinatorics_recursion_m2,combinatorics,recursion,A,1.0,0.95,A,0.8,A,0.98,A,1.0,B
s1.1-7B,combinatorics_recursion_m3,combinatorics,recursion,A,1.0,0.9,A,0.8,B,0.85,A,0.9,A
s1.1-7B,combinatorics_recursion_h1,combinatorics,recursion,A,1.0,0.95,A,1.0,A,0.98,A,1.0,A
s1.1-7B,combinatorics_recursion_h2,combinatorics,recursion,B,0.0,0.95,A,0.9,B,0.92,A,0.95,B
s1.1-7B,combinatorics_recursion_h3,combinatorics,recursion,B,1.0,0.85,B,0.95,B,0.95,A,0.95,A
s1.1-7B,statistics_descriptive_e1,statistics,descriptive statistics,B,0.0,0.85,B,0.85,A,0.95,A,0.95,A
s1.1-7B,statistics_descriptive_e2,statistics,descriptive statistics,A,1.0,0.95,A,0.95,A,0.95,B,0.95,B
s1.1-7B,statistics_descriptive_e3,statistics,descriptive statistics,A,1.0,0.95,A,0.95,A,0.98,A,0.95,A
s1.1-7B,statistics_descriptive_m1,statistics,descriptive statistics,A,1.0,0.9,A,0.95,A,0.92,A,0.95,B
s1.1-7B,statistics_descriptive_m2,statistics,descriptive statistics,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,statistics_descriptive_m3,statistics,descriptive statistics,B,1.0,0.95,B,0.98,B,0.85,B,0.95,B
s1.1-7B,statistics_descriptive_h1,statistics,descriptive statistics,A,0.0,0.95,B,0.9,B,0.95,A,0.95,B
s1.1-7B,statistics_descriptive_h2,statistics,descriptive statistics,B,0.0,0.95,A,0.95,B,0.75,,,B
s1.1-7B,statistics_descriptive_h3,statistics,descriptive statistics,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
s1.1-7B,statistics_distributions_e1,statistics,distributions,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,statistics_distributions_e2,statistics,distributions,A,0.0,0.95,B,0.95,A,0.95,B,0.95,A
s1.1-7B,statistics_distributions_e3,statistics,distributions,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
s1.1-7B,statistics_distributions_m1,statistics,distributions,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,statistics_distributions_m2,statistics,distributions,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
s1.1-7B,statistics_distributions_m3,statistics,distributions,A,1.0,1.0,A,0.95,A,0.98,A,0.95,A
s1.1-7B,statistics_distributions_h1,statistics,distributions,A,1.0,0.95,A,0.9,B,0.95,A,0.95,A
s1.1-7B,statistics_distributions_h2,statistics,distributions,A,1.0,0.95,B,0.85,A,0.95,A,0.95,A
s1.1-7B,statistics_distributions_h3,statistics,distributions,A,1.0,0.95,A,0.9,A,0.95,A,0.9,B
s1.1-7B,statistics_hypothesis_e1,statistics,hypothesis testing,B,0.0,0.85,A,0.9,A,0.95,A,0.95,A
s1.1-7B,statistics_hypothesis_e2,statistics,hypothesis testing,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
s1.1-7B,statistics_hypothesis_e3,statistics,hypothesis testing,A,1.0,0.9,A,0.85,A,0.9,A,0.95,B
s1.1-7B,statistics_hypothesis_m1,statistics,hypothesis testing,A,1.0,0.95,A,0.98,A,0.95,A,0.95,A
s1.1-7B,statistics_hypothesis_m2,statistics,hypothesis testing,A,1.0,0.95,A,0.98,A,0.95,A,0.95,A
s1.1-7B,statistics_hypothesis_m3,statistics,hypothesis testing,A,0.0,0.85,B,0.75,B,0.95,B,0.8,B
s1.1-7B,statistics_hypothesis_h1,statistics,hypothesis testing,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
s1.1-7B,statistics_hypothesis_h2,statistics,hypothesis testing,A,0.0,0.65,B,0.95,B,0.85,B,0.95,B
s1.1-7B,statistics_hypothesis_h3,statistics,hypothesis testing,A,1.0,0.95,A,0.99,A,0.98,A,1.0,A
s1.1-7B,statistics_regression_e1,statistics,regression,B,0.0,0.95,A,0.85,A,0.95,A,0.95,A
s1.1-7B,statistics_regression_e2,statistics,regression,A,1.0,0.95,A,0.98,A,0.95,A,0.95,B
s1.1-7B,statistics_regression_e3,statistics,regression,A,0.0,0.95,B,0.85,B,0.92,B,0.9,B
s1.1-7B,statistics_regression_m1,statistics,regression,B,0.0,0.92,A,0.85,A,0.95,,,A
s1.1-7B,statistics_regression_m2,statistics,regression,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,statistics_regression_m3,statistics,regression,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
s1.1-7B,statistics_regression_h1,statistics,regression,A,0.0,0.95,B,0.9,B,0.95,A,0.95,B
s1.1-7B,statistics_regression_h2,statistics,regression,B,1.0,0.95,B,0.95,B,0.95,A,0.95,B
s1.1-7B,statistics_regression_h3,statistics,regression,A,1.0,0.95,A,0.95,A,0.85,A,0.95,B
s1.1-7B,statistics_bayesian_e1,statistics,bayesian inference,A,1.0,0.9,A,0.95,A,0.95,A,0.95,A
s1.1-7B,statistics_bayesian_e2,statistics,bayesian inference,B,1.0,0.85,B,0.85,B,0.95,A,0.95,B
s1.1-7B,statistics_bayesian_e3,statistics,bayesian inference,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
s1.1-7B,statistics_bayesian_m1,statistics,bayesian inference,A,1.0,0.95,A,0.9,A,0.98,A,0.95,A
s1.1-7B,statistics_bayesian_m2,statistics,bayesian inference,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,statistics_bayesian_m3,statistics,bayesian inference,B,1.0,0.95,B,0.95,B,0.95,B,0.95,A
s1.1-7B,statistics_bayesian_h1,statistics,bayesian inference,A,1.0,0.95,B,0.8,A,0.85,A,0.95,A
s1.1-7B,statistics_bayesian_h2,statistics,bayesian inference,B,0.0,0.85,A,0.75,A,0.85,A,0.95,A
s1.1-7B,statistics_bayesian_h3,statistics,bayesian inference,B,1.0,0.9,B,0.95,B,0.95,A,0.85,A
s1.1-7B,linearalgebra_matrices_e1,linear algebra,matrices,A,1.0,0.95,B,0.95,A,0.95,A,0.95,B
s1.1-7B,linearalgebra_matrices_e2,linear algebra,matrices,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,linearalgebra_matrices_e3,linear algebra,matrices,A,1.0,0.85,A,0.95,A,0.95,B,0.95,B
s1.1-7B,linearalgebra_matrices_m1,linear algebra,matrices,A,0.0,0.95,B,0.65,B,0.95,A,0.95,A
s1.1-7B,linearalgebra_matrices_m2,linear algebra,matrices,B,1.0,0.95,B,0.95,A,0.95,B,0.95,A
s1.1-7B,linearalgebra_matrices_m3,linear algebra,matrices,A,1.0,0.95,A,0.85,B,0.9,A,0.95,A
s1.1-7B,linearalgebra_matrices_h1,linear algebra,matrices,A,0.0,0.95,B,0.85,B,0.95,A,0.95,A
s1.1-7B,linearalgebra_matrices_h2,linear algebra,matrices,A,1.0,0.95,A,0.9,A,0.95,A,0.95,A
s1.1-7B,linearalgebra_matrices_h3,linear algebra,matrices,A,1.0,0.95,A,0.95,A,0.95,B,0.95,A
s1.1-7B,linearalgebra_determinants_e1,linear algebra,determinants,A,0.0,0.95,B,0.95,B,0.95,A,0.95,B
s1.1-7B,linearalgebra_determinants_e2,linear algebra,determinants,A,1.0,0.95,A,0.95,A,0.95,A,0.95,B
s1.1-7B,linearalgebra_determinants_e3,linear algebra,determinants,A,0.0,0.9,B,0.95,B,0.95,B,0.95,B
s1.1-7B,linearalgebra_determinants_m1,linear algebra,determinants,B,0.0,0.95,A,0.85,A,0.95,A,0.95,B
s1.1-7B,linearalgebra_determinants_m2,linear algebra,determinants,B,0.0,0.95,A,0.95,A,0.98,A,0.95,A
s1.1-7B,linearalgebra_determinants_m3,linear algebra,determinants,A,1.0,0.95,A,0.9,A,0.98,A,1.0,A
s1.1-7B,linearalgebra_determinants_h1,linear algebra,determinants,Tie,0.5,0.5,B,1.0,B,0.95,B,0.95,A
s1.1-7B,linearalgebra_determinants_h2,linear algebra,determinants,B,1.0,0.85,B,0.95,B,0.95,B,0.95,B
s1.1-7B,linearalgebra_determinants_h3,linear algebra,determinants,B,0.0,0.9,A,0.95,A,0.95,A,0.95,B
s1.1-7B,linearalgebra_vectorspaces_e1,linear algebra,vector spaces,B,0.0,0.95,A,0.85,A,0.9,B,0.95,A
s1.1-7B,linearalgebra_vectorspaces_e2,linear algebra,vector spaces,A,0.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,linearalgebra_vectorspaces_e3,linear algebra,vector spaces,B,0.0,0.85,A,0.85,B,0.95,A,0.95,A
s1.1-7B,linearalgebra_vectorspaces_m1,linear algebra,vector spaces,A,0.0,0.85,B,0.9,B,0.95,B,1.0,B
s1.1-7B,linearalgebra_vectorspaces_m2,linear algebra,vector spaces,B,1.0,0.92,B,0.85,B,0.95,A,0.95,B
s1.1-7B,linearalgebra_vectorspaces_m3,linear algebra,vector spaces,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,linearalgebra_vectorspaces_h1,linear algebra,vector spaces,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,linearalgebra_vectorspaces_h2,linear algebra,vector spaces,A,1.0,0.95,A,0.85,A,0.95,A,0.95,B
s1.1-7B,linearalgebra_vectorspaces_h3,linear algebra,vector spaces,A,1.0,0.75,A,0.95,A,0.85,B,0.9,A
s1.1-7B,linearalgebra_eigenvalues_e1,linear algebra,eigenvalues,A,0.0,0.95,B,0.95,B,0.95,B,1.0,B
s1.1-7B,linearalgebra_eigenvalues_e2,linear algebra,eigenvalues,A,1.0,0.95,A,0.95,B,0.95,A,0.95,B
s1.1-7B,linearalgebra_eigenvalues_e3,linear algebra,eigenvalues,B,1.0,0.85,B,0.98,B,0.98,A,0.95,A
s1.1-7B,linearalgebra_eigenvalues_m1,linear algebra,eigenvalues,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,linearalgebra_eigenvalues_m2,linear algebra,eigenvalues,B,1.0,0.95,B,0.65,B,0.9,A,0.9,B
s1.1-7B,linearalgebra_eigenvalues_m3,linear algebra,eigenvalues,B,1.0,0.85,B,0.9,B,0.95,A,0.95,B
s1.1-7B,linearalgebra_eigenvalues_h1,linear algebra,eigenvalues,B,0.0,0.95,B,0.85,A,0.95,A,0.95,A
s1.1-7B,linearalgebra_eigenvalues_h2,linear algebra,eigenvalues,A,1.0,0.85,B,0.85,A,0.9,A,0.95,A
s1.1-7B,linearalgebra_eigenvalues_h3,linear algebra,eigenvalues,B,1.0,0.95,B,0.98,B,0.98,B,1.0,A
s1.1-7B,linearalgebra_transformations_e1,linear algebra,linear transformations,A,0.0,0.95,B,0.9,B,0.95,A,0.95,A
s1.1-7B,linearalgebra_transformations_e2,linear algebra,linear transformations,A,1.0,0.95,A,0.95,A,0.95,A,0.95,A
s1.1-7B,linearalgebra_transformations_e3,linear algebra,linear transformations,A,0.0,0.95,B,0.95,B,0.95,B,0.95,A
s1.1-7B,linearalgebra_transformations_m1,linear algebra,linear transformations,B,1.0,0.95,B,0.95,B,0.95,B,0.95,B
s1.1-7B,linearalgebra_transformations_m2,linear algebra,linear transformations,A,1.0,0.95,A,1.0,A,0.95,A,0.95,A
s1.1-7B,linearalgebra_transformations_m3,linear algebra,linear transformations,A,1.0,0.95,B,0.85,A,0.98,A,0.95,B
s1.1-7B,linearalgebra_transformations_h1,linear algebra,linear transformations,A,0.0,0.95,B,0.95,B,0.95,,,B
s1.1-7B,linearalgebra_transformations_h2,linear algebra,linear transformations,B,1.0,0.9,B,0.95,A,0.95,B,0.95,A
s1.1-7B,linearalgebra_transformations_h3,linear algebra,linear transformations,B,1.0,0.95,B,0.95,B,0.92,B,0.95,A
