
# Registry of model endpoint configurations, keyed by a configuration name.
#
# Each value is a dict. Keys that appear in the entries below:
#   "model_name"    - either a local snapshot directory path or a hub-style
#                     "org/name" identifier.
#   "tag_name"      - a short label; several entries share the same tag
#                     (e.g. the four "Llama-3-8B-Instruct*" entries, which
#                     differ only in their "url").
#   "url"           - HTTP endpoint; every "prompt" entry uses a
#                     ".../v1/completions" path and the single "chat" entry
#                     uses ".../v1/chat/completions".
#   "mode"          - "prompt", "chat" or "match" in this table.
#   "remote"        - True on the two entries whose URL host is not localhost;
#                     absent everywhere else.
#   "local_path"    - present only on "Llama-3-70B-Instruct-12".
#   "chat_template" - present only on "vicuna-7b-v1.5".
#
# How the consumer interprets these keys (and which are optional) is not
# visible in this file - TODO confirm against the code that reads this dict.
#
# NOTE(review): three URLs are each used by two entries (localhost:2010,
# localhost:2011, localhost:2007); see the inline notes below. Presumably only
# one model of each pair is served at a time - confirm before using both.
model_load_config={
    # NOTE(review): same URL (localhost:2010) as "Llama-3-8B-Instruct-2".
    "Llama-3-70B-Instruct":
    {
        "model_name": "/mnt/data/huggingface/hub/models--meta-llama--Meta-Llama-3-70B-Instruct/snapshots/1480bb72e06591eb87b0ebe2c8853127f9697bae/",
        "tag_name": "Llama-3-70B-Instruct",
        "url": "http://localhost:2010/v1/completions",
        "mode": "prompt"
    },
    # Non-localhost endpoint; "model_name" is a hub-style identifier and the
    # snapshot directory is given separately as "local_path".
    "Llama-3-70B-Instruct-12":
    { 
        "model_name":  "meta-llama/Meta-Llama-3-70B-Instruct",
        "tag_name": "Llama-3-70B-Instruct",
        "url": "http://172.18.131.12:8000/v1/completions",
        "mode": "prompt",
        "remote": True,
        "local_path":"/mnt/data/huggingface/hub/models--meta-llama--Meta-Llama-3-70B-Instruct/snapshots/1480bb72e06591eb87b0ebe2c8853127f9697bae/",
    },
    # The next four entries share "model_name" and "tag_name" and differ only
    # in the port of "url" (2000, 2010, 2011, 2012).
    "Llama-3-8B-Instruct":
    {
        "model_name":"/mnt/data/huggingface/hub/models--meta-llama--Meta-Llama-3-8B-Instruct/snapshots/a8977699a3d0820e80129fb3c93c20fbd9972c41/",
        "tag_name": "Llama-3-8B-Instruct",
        "url":"http://localhost:2000/v1/completions" ,
        "mode": "prompt"
    },
    # NOTE(review): same URL (localhost:2010) as "Llama-3-70B-Instruct".
    "Llama-3-8B-Instruct-2":
    {
        "model_name":"/mnt/data/huggingface/hub/models--meta-llama--Meta-Llama-3-8B-Instruct/snapshots/a8977699a3d0820e80129fb3c93c20fbd9972c41/",
        "tag_name": "Llama-3-8B-Instruct",
        "url":"http://localhost:2010/v1/completions" ,
        "mode": "prompt"
    },
    # NOTE(review): same URL (localhost:2011) as "Qwen2-72B-Instruct".
    "Llama-3-8B-Instruct-3":
    {
        "model_name":"/mnt/data/huggingface/hub/models--meta-llama--Meta-Llama-3-8B-Instruct/snapshots/a8977699a3d0820e80129fb3c93c20fbd9972c41/",
        "tag_name": "Llama-3-8B-Instruct",
        "url":"http://localhost:2011/v1/completions" ,
        "mode": "prompt"
    },
    "Llama-3-8B-Instruct-4":
    {
        "model_name":"/mnt/data/huggingface/hub/models--meta-llama--Meta-Llama-3-8B-Instruct/snapshots/a8977699a3d0820e80129fb3c93c20fbd9972c41/",
        "tag_name": "Llama-3-8B-Instruct",
        "url":"http://localhost:2012/v1/completions" ,
        "mode": "prompt"
    },
    # The only "chat"-mode entry; its URL is a chat-completions path on a
    # non-localhost host, and its "tag_name" keeps the "-144" suffix.
    "Qwen2-72B-Instruct-144":
    {
        "model_name":"Qwen/Qwen2-72B-Instruct",
        "tag_name": "Qwen2-72B-Instruct-144",
        "url":"http://210.75.240.144:3006/v1/chat/completions" ,
        "mode": "chat",
        "remote": True
    },
    # NOTE(review): same URL (localhost:2011) as "Llama-3-8B-Instruct-3".
    "Qwen2-72B-Instruct":
    {
        "model_name":"/mnt/data/huggingface/hub/models--Qwen--Qwen2-72B-Instruct/snapshots/1af63c698f59c4235668ec9c1395468cb7cd7e79/",
        "tag_name": "Qwen2-72B-Instruct",
        "url":"http://localhost:2011/v1/completions" ,
        "mode": "prompt"
    },
    "Mistral-7B-Instruct-v0.3":
    {
        "model_name":"/mnt/data/huggingface/hub/models--mistralai--Mistral-7B-Instruct-v0.3/snapshots/0417f4babd26db0b5ed07c1d0bc85658ab526ea3/",
        "tag_name": "Mistral-7B-Instruct-v0.3",
        "url":"http://localhost:2002/v1/completions" ,
        "mode": "prompt"
    },

    "Llama-2-7b-chat-hf":
    {
        "model_name":"/mnt/data/huggingface/hub/models--meta-llama--Llama-2-7b-chat-hf/snapshots/f5db02db724555f92da89c216ac04704f23d4590/",
        "tag_name": "Llama-2-7b-chat-hf",
        "url":"http://localhost:2005/v1/completions" ,
        "mode": "prompt"
    },
    "gemma-2-9b-it":
    {
        "model_name":"/mnt/data/huggingface/hub/models--google--gemma-2-9b-it/snapshots/11c9b309abf73637e4b6f9a3fa1e92e615547819/",
        "tag_name": "gemma-2-9b-it",
        "url":"http://localhost:2003/v1/completions" ,
        "mode": "prompt"
    },
    "Qwen2-7B-Instruct":
    {
        "model_name":"/mnt/data/huggingface/hub/models--Qwen--Qwen2-7B-Instruct/snapshots/41c66b0be1c3081f13defc6bdf946c2ef240d6a6/",
        "tag_name": "Qwen2-7B-Instruct",
        "url":"http://localhost:2004/v1/completions" ,
        "mode": "prompt"
    },
    # NOTE(review): same URL (localhost:2007) as "Llama-2-13b-chat-hf".
    "Qwen2-1.5B-Instruct":
    {
        "model_name":"/mnt/data/huggingface/hub/models--Qwen--Qwen2-1.5B-Instruct/snapshots/ba1cf1846d7df0a0591d6c00649f57e798519da8/",
        "tag_name": "Qwen2-1.5B-Instruct",
        "url":"http://localhost:2007/v1/completions" ,
        "mode": "prompt"
    },
    # NOTE(review): same URL (localhost:2007) as "Qwen2-1.5B-Instruct".
    "Llama-2-13b-chat-hf":
    {
        "model_name":"/mnt/data/huggingface/hub/models--meta-llama--Llama-2-13b-chat-hf/snapshots/a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8/",
        "tag_name": "Llama-2-13b-chat-hf",
        "url":"http://localhost:2007/v1/completions" ,
        "mode": "prompt"
    },
    "Phi-3-mini-4k-instruct":
    {
        "model_name":"/mnt/data/huggingface/hub/models--microsoft--Phi-3-mini-4k-instruct/snapshots/5a516f86087853f9d560c95eb9209c1d4ed9ff69/",
        "tag_name": "Phi-3-mini-4k-instruct",
        "url":"http://localhost:2006/v1/completions" ,
        "mode": "prompt"
    },
    # The only entry that carries its own "chat_template" (Jinja-style markup).
    # The template uses a default system message when the first message is not
    # a 'system' message, raises if user/assistant roles do not alternate, and
    # emits ' USER: ...' / ' ASSISTANT: ...' turns. The `\\'` in the default
    # system message is a Python escape for a backslash followed by an
    # apostrophe, so the stored string contains `\'` inside the template's
    # single-quoted literal.
    "vicuna-7b-v1.5":
    {
        "model_name":"/mnt/data/huggingface/hub/models--lmsys--vicuna-7b-v1.5/snapshots/3321f76e3f527bd14065daf69dad9344000a201d/",
        "tag_name": "vicuna-7b-v1.5",
        "url":"http://localhost:2001/v1/completions" ,
        "mode": "prompt",
        "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = 'A chat between a curious user and an artificial intelligence assistant. The assistant gives helpful, detailed, and polite answers to the user\\'s questions.' %}{% endif %}{% for message in loop_messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if loop.index0 == 0 %}{{ system_message }}{% endif %}{% if message['role'] == 'user' %}{{ ' USER: ' + message['content'].strip() }}{% elif message['role'] == 'assistant' %}{{ ' ASSISTANT: ' + message['content'].strip() + eos_token }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ ' ASSISTANT:' }}{% endif %}",
    },
    "Qwen2.5-3B-Instruct":
    {
        "model_name":"/mnt/data/huggingface/hub/models--Qwen--Qwen2.5-3B-Instruct/snapshots/82f42baa094a9600e39ccd80d34058aeeb3abbc1/",
        "tag_name": "Qwen2.5-3B-Instruct",
        "url":"http://localhost:2031/v1/completions" ,
        "mode": "prompt" 
    },
    # The next two entries share "model_name" and "tag_name" and differ only
    # in the port of "url" (2032 vs 2035).
    "Qwen2.5-7B-Instruct":
    {
        "model_name":"/mnt/data/huggingface/hub/models--Qwen--Qwen2.5-7B-Instruct/snapshots/acbd96531cda22292a3ceaa67e984955d3965282/",
        "tag_name": "Qwen2.5-7B-Instruct",
        "url":"http://localhost:2032/v1/completions" ,
        "mode": "prompt" 
    },
    "Qwen2.5-7B-Instruct-2":
    {
        "model_name":"/mnt/data/huggingface/hub/models--Qwen--Qwen2.5-7B-Instruct/snapshots/acbd96531cda22292a3ceaa67e984955d3965282/",
        "tag_name": "Qwen2.5-7B-Instruct",
        "url":"http://localhost:2035/v1/completions" ,
        "mode": "prompt" 
    },
    "Qwen2.5-14B-Instruct":
    {
        "model_name":"/mnt/data/huggingface/hub/models--Qwen--Qwen2.5-14B-Instruct/snapshots/502e5d8bfd665ed113fd9b3626445ca7b0596303/",
        "tag_name": "Qwen2.5-14B-Instruct",
        "url":"http://localhost:2033/v1/completions" ,
        "mode": "prompt" 
    },
    "Qwen2.5-32B-Instruct":
    {
        "model_name":"/mnt/data/huggingface/hub/models--Qwen--Qwen2.5-32B-Instruct/snapshots/70e8dfb9ad18a7d499f765fe206ff065ed8ca197/",
        "tag_name": "Qwen2.5-32B-Instruct",
        "url":"http://localhost:2034/v1/completions" ,
        "mode": "prompt" 
    },
    # Special entry with no "model_name" or "url"; only a tag and mode "match".
    # Code that indexes entry["url"] or entry["model_name"] unconditionally
    # would raise KeyError on this entry.
    # NOTE(review): presumably selects a non-model matching path - confirm.
    "match":
    {
        "tag_name": "match",
        "mode": "match" 
    },
}


 


 