# Top-level run options. `api_url` and `chat_template` are explicitly null.
analysis_report: false
# NOTE(review): `EMPTY` looks like a placeholder rather than a real credential
# -- confirm no key is required while `api_url` is null.
api_key: 'EMPTY'
api_url: null
chat_template: null
# Per-dataset settings, keyed by dataset name. Only `gsm8k` is configured.
dataset_args:
  gsm8k:
    dataset_id: 'modelscope/gsm8k'
    # Folded scalar: the two lines are joined by one space, no trailing newline.
    description: >-
      GSM8K (Grade School Math 8K) is a dataset of grade school math problems,
      designed to evaluate the mathematical reasoning abilities of AI models.
    eval_split: 'test'
    extra_params: {}
    # NOTE(review): `few_shot_num` is 4 while `train_split` (further down) is
    # null -- confirm where the few-shot examples are taken from.
    few_shot_num: 4
    few_shot_random: false
    filters: null
    metric_list: ['AverageAccuracy']
    model_adapter: 'generation'
    name: 'gsm8k'
    output_types: ['generation']
    pretty_name: 'GSM8K'
    # Literal scalar: three lines separated by single newlines, no trailing
    # newline. `{query}` is a placeholder in the text (presumably substituted
    # by the consumer -- verify).
    prompt_template: |-
      Question: {query}
      Let's think step by step
      Answer:
    query_template: null
    subset_list: ['main']
    system_prompt: null
    tags: ['Mathematics']
    train_split: null
# Dataset source and evaluation settings.
# NOTE(review): `dataset_dir` is an absolute, machine-specific path -- confirm
# it exists wherever this config is reused.
dataset_dir: '/data/models/modelscope/datasets'
dataset_hub: 'modelscope'
# The single entry matches the `gsm8k` key configured under `dataset_args`.
datasets: ['gsm8k']
debug: false
dry_run: false
eval_backend: 'Native'
eval_batch_size: 1
eval_config: null
eval_type: 'checkpoint'
# Text-generation settings, grouped as length limits then sampling knobs.
generation_config:
  # NOTE(review): both `max_length` and `max_new_tokens` are set -- confirm
  # which one the generation backend actually honors.
  max_length: 2048
  max_new_tokens: 512
  # NOTE(review): `do_sample` is false, so the sampling knobs below are
  # presumably unused -- verify against the backend.
  do_sample: false
  temperature: 1.0
  top_k: 50
  top_p: 1.0
# Error handling, judge settings, sample limit, and the model location.
ignore_errors: false
judge_model_args: {}
judge_strategy: 'auto'
judge_worker_num: 1
# NOTE(review): presumably caps the number of evaluated samples at 20 --
# confirm this small limit is intended for the reported results.
limit: 20
mem_cache: false
# Absolute local filesystem path (machine-specific).
model: '/data/models/llama3.2-3B/'
# Extra arguments associated with `model`.
model_args:
  # Stored as a plain string; presumably mapped to a torch dtype by the
  # consumer -- verify.
  precision: 'torch.float16'
  revision: 'master'
# Remaining run options.
# NOTE(review): `model_id` is an empty string, not null like the other unset
# options in this group -- confirm the consumer treats the two the same way.
model_id: ''
model_task: 'text_generation'
outputs: null
seed: 42
stage: 'all'
stream: false
template_type: null
timeout: null
use_cache: null
# Relative path; the directory name looks like a run timestamp
# (2025-08-29 11:35:12) -- presumably generated per run.
work_dir: './outputs/20250829_113512'
