# name: str
#     model_name: str
#     endpoints: defaults to null
#         - api_base: str
#           api_key: str
#     api_type: str
#     tokenizer: name of the model on Hugging Face; open-source LLMs are required to set this field
#     parallel: int
#     max_model_len: int

# openai
gpt-4o-2024-08-06:
    model_name: gpt-4o-2024-08-06
    endpoints:
        # Placeholder values: set the real api_base and api_key before use.
        - api_base: xxx
          api_key: null
    api_type: openai
    # Exactly one `parallel` key per entry: duplicate mapping keys are invalid
    # YAML, and most loaders silently keep only the last occurrence.
    # NOTE(review): a stray, duplicate `parallel: 50` that trailed this entry
    # was removed; last-wins loaders used to resolve this key to 50, so
    # confirm that 200 is the intended value.
    parallel: 200


# Qwen2
Qwen2-7B-Instruct:
    # Model identity. `tokenizer` is the Hugging Face model name, which the
    # schema notes at the top of this file require for open-source LLMs.
    model_name: Qwen2-7B-Instruct
    tokenizer: Qwen/Qwen2-7B-Instruct
    max_model_len: 32768
    # Endpoint on localhost, addressed with the `openai` api_type.
    # `EMPTY` is a literal string value, quoted so it is not mistaken for a
    # missing/blank key.
    api_type: openai
    endpoints:
        - api_base: 'http://localhost:80/v1'
          api_key: 'EMPTY'
    parallel: 100


