---
# Task definition registered under the name "math".
name: math

# Top-level cap on the number of examples.
# NOTE(review): 105 = 7 x 15, i.e. seven times per_category_limit below;
# presumably the two are meant to stay in sync -- confirm against the loader.
limit: 105

# Keyword arguments handed to the task implementation.
kwargs:
  # Where the examples come from.
  dataset: hendrycks/math
  split: test
  dataset_config: null  # explicitly unset

  # Names of the record fields holding the prompt text and the reference.
  # NOTE(review): presumably looked up on each dataset row -- verify.
  question_key: problem
  answer_key: solution

  # Folded block scalar: the two lines below join with a single space and
  # the trailing newline is stripped; the backslash stays literal.
  system_prompt: >-
    Please reason step by step, and put your final answer within
    \boxed{}.

  # Answer checking options.
  # NOTE(review): exact semantics are defined by the consuming code.
  use_math_verify: true
  parse_mode: response

  # Per-category sampling; a fixed seed is given alongside the shuffle flag.
  per_category_limit: 15
  per_category_shuffle: true
  per_category_seed: 42
