model_path: /nvme/qa_test_models
resource_path: /nvme/qa_test_models/resource
log_path: /nvme/qa_test_models/autotest_model/log
eval_log_path: /nvme/qa_test_models/evaluation_report
benchmark_path: /nvme/qa_test_models/benchmark-reports
dataset_path: /nvme/qa_test_models/datasets/ShareGPT_V3_unfiltered_cleaned_split.json
prefix_dataset_path: /nvme/qa_test_models/datasets/prefix_cache_test.json
env_tag: h800

tp_config:
    Intern-S1: 8
    Qwen3-235B-A22B: 8
    Qwen3-235B-A22B-FP8: 4
    Qwen3-30B-A3B: 2
    Qwen3-32B: 2
    gpt-oss-120b: 2
    gpt-oss-120b-BF16: 4
    gpt-oss-20b-BF16: 2
    Qwen2.5-32B-Instruct: 2

turbomind_chat_model:
    tp:
        - internlm/Intern-S1
        - internlm/Intern-S1-mini
        - Qwen/Qwen3-0.6B-FP8
        - Qwen/Qwen3-1.7B-FP8
        - Qwen/Qwen3-4B-FP8
        - Qwen/Qwen3-8B-FP8
        - Qwen/Qwen3-14B-FP8
        - Qwen/Qwen3-235B-A22B
        - Qwen/Qwen3-235B-A22B-FP8
        - Qwen/Qwen3-30B-A3B
        - Qwen/Qwen3-30B-A3B-FP8
        - Qwen/Qwen3-32B
        - Qwen/Qwen3-32B-FP8
        - openai/gpt-oss-120b
        - openai/gpt-oss-20b

pytorch_chat_model:
    tp:
        - internlm/Intern-S1
        - internlm/Intern-S1-mini
        - Qwen/Qwen3-0.6B-FP8
        - Qwen/Qwen3-1.7B-FP8
        - Qwen/Qwen3-4B-FP8
        - Qwen/Qwen3-8B-FP8
        - Qwen/Qwen3-14B-FP8
        - Qwen/Qwen3-235B-A22B
        - Qwen/Qwen3-235B-A22B-FP8
        - Qwen/Qwen3-30B-A3B
        - Qwen/Qwen3-30B-A3B-FP8
        - Qwen/Qwen3-32B
        - Qwen/Qwen3-32B-FP8
        - unsloth/gpt-oss-120b-BF16
        - unsloth/gpt-oss-20b-BF16

turbomind_vl_model:
   tp:
        - internlm/Intern-S1
        - internlm/Intern-S1-mini

pytorch_vl_model:
   tp:
        - internlm/Intern-S1
        - internlm/Intern-S1-mini

turbomind_base_model:
    tp:
        - internlm/Intern-S1-mini
        - Qwen/Qwen3-4B-FP8
        - openai/gpt-oss-20b

pytorch_base_model:
    tp:
        - internlm/Intern-S1-mini
        - Qwen/Qwen3-4B-FP8
        - unsloth/gpt-oss-20b-BF16

turbomind_quantization:
    no_awq:
        - internlm/Intern-S1
        - internlm/Intern-S1-mini
        - Qwen/Qwen3-0.6B-FP8
        - Qwen/Qwen3-1.7B-FP8
        - Qwen/Qwen3-4B-FP8
        - Qwen/Qwen3-8B-FP8
        - Qwen/Qwen3-14B-FP8
        - Qwen/Qwen3-235B-A22B
        - Qwen/Qwen3-235B-A22B-FP8
        - Qwen/Qwen3-30B-A3B
        - Qwen/Qwen3-30B-A3B-FP8
        - Qwen/Qwen3-32B
        - Qwen/Qwen3-32B-FP8
        - openai/gpt-oss-120b
        - openai/gpt-oss-20b
    gptq:
        - empty
    no_kvint4:
        - internlm/Intern-S1
        - internlm/Intern-S1-mini
        - Qwen/Qwen3-0.6B-FP8
        - Qwen/Qwen3-1.7B-FP8
        - Qwen/Qwen3-4B-FP8
        - Qwen/Qwen3-8B-FP8
        - Qwen/Qwen3-14B-FP8
        - Qwen/Qwen3-235B-A22B
        - Qwen/Qwen3-235B-A22B-FP8
        - Qwen/Qwen3-30B-A3B
        - Qwen/Qwen3-30B-A3B-FP8
        - Qwen/Qwen3-32B
        - Qwen/Qwen3-32B-FP8
        - openai/gpt-oss-120b
        - openai/gpt-oss-20b
    no_kvint8:
        - empty

pytorch_quantization:
    awq:
        - empty
    w8a8:
        - empty
    no_kvint4:
        - internlm/Intern-S1
        - internlm/Intern-S1-mini
        - Qwen/Qwen3-0.6B-FP8
        - Qwen/Qwen3-1.7B-FP8
        - Qwen/Qwen3-4B-FP8
        - Qwen/Qwen3-8B-FP8
        - Qwen/Qwen3-14B-FP8
        - Qwen/Qwen3-235B-A22B
        - Qwen/Qwen3-235B-A22B-FP8
        - Qwen/Qwen3-30B-A3B
        - Qwen/Qwen3-30B-A3B-FP8
        - Qwen/Qwen3-32B
        - Qwen/Qwen3-32B-FP8
    no_kvint8:
        - empty


evaluate_model:
    - internlm/Intern-S1-mini
    - Qwen/Qwen3-0.6B-FP8
    - Qwen/Qwen3-1.7B-FP8
    - Qwen/Qwen3-4B-FP8
    - Qwen/Qwen3-8B-FP8
    - Qwen/Qwen3-14B-FP8
    - Qwen/Qwen3-32B
    - Qwen/Qwen3-32B-FP8
    - Qwen/Qwen3-30B-A3B
    - Qwen/Qwen3-30B-A3B-FP8
    - Qwen/Qwen3-235B-A22B
    - Qwen/Qwen3-235B-A22B-FP8
    - openai/gpt-oss-120b
    - openai/gpt-oss-20b
    - unsloth/gpt-oss-120b-BF16
    - unsloth/gpt-oss-20b-BF16
