# Baseline settings shared by the model entries below. Every entry under
# `models` repeats `num_workers`, and some repeat `is_closed`, so these look
# like fallbacks that per-model keys override -- the merge itself would happen
# in the code that reads this file, not here (TODO confirm).
defaults:
  temperature: 0.0
  max_tokens: 8
  # Every model entry visible in this file sets its own `num_workers`, so this
  # value presumably only matters for an entry that omits the key.
  num_workers: 16
  timeout: 60  # unit is not stated here; presumably seconds -- confirm
  max_retries: 3
  # Only the `oneapi` entries set `is_closed: true`; the others leave it unset.
  is_closed: false
# Model registry. The entries in this first group all use the `nvdev`
# framework; each key is the entry's `model` id with `/` replaced by `_`.
# `num_workers` is set on every entry (presumably a per-model concurrency
# limit -- confirm with the code that reads this file).
# String values are single-quoted so they can never be re-typed by the parser.
models:
  meta_llama-3.1-70b-instruct:
    framework: 'nvdev'
    model: 'meta/llama-3.1-70b-instruct'
    num_workers: 4
  meta_llama-3.2-3b-instruct:
    framework: 'nvdev'
    model: 'meta/llama-3.2-3b-instruct'
    num_workers: 24
  meta_llama-3.2-1b-instruct:
    framework: 'nvdev'
    model: 'meta/llama-3.2-1b-instruct'
    num_workers: 32
  meta_llama-3.1-8b-instruct:
    framework: 'nvdev'
    model: 'meta/llama-3.1-8b-instruct'
    num_workers: 24
  meta_llama-3.1-405b-instruct:
    framework: 'nvdev'
    model: 'meta/llama-3.1-405b-instruct'
    num_workers: 2
  nvidia_llama-3.1-nemotron-70b-instruct:
    framework: 'nvdev'
    model: 'nvidia/llama-3.1-nemotron-70b-instruct'
    num_workers: 4
  nvidia_llama-3.1-nemotron-ultra-253b-v1:
    framework: 'nvdev'
    model: 'nvidia/llama-3.1-nemotron-ultra-253b-v1'
    num_workers: 4
  nvidia_llama-3.3-nemotron-super-49b-v1:
    framework: 'nvdev'
    model: 'nvidia/llama-3.3-nemotron-super-49b-v1'
    num_workers: 8
  nvidia_llama-3.1-nemotron-nano-8b-v1:
    framework: 'nvdev'
    model: 'nvidia/llama-3.1-nemotron-nano-8b-v1'
    num_workers: 1
  nvidia_nemotron-mini-4b-instruct:
    framework: 'nvdev'
    model: 'nvidia/nemotron-mini-4b-instruct'
    num_workers: 8
  mistralai_mixtral-8x22b-instruct-v0.1:
    framework: 'nvdev'
    model: 'mistralai/mixtral-8x22b-instruct-v0.1'
    num_workers: 8
  nv-mistralai_mistral-nemo-12b-instruct:
    framework: 'nvdev'
    model: 'nv-mistralai/mistral-nemo-12b-instruct'
    num_workers: 16
  google_gemma-2-2b-it:
    framework: 'nvdev'
    model: 'google/gemma-2-2b-it'
    num_workers: 32
  google_gemma-3-27b-it:
    framework: 'nvdev'
    model: 'google/gemma-3-27b-it'
    num_workers: 8
  meta_llama-4-scout-17b-16e-instruct:
    framework: 'nvdev'
    model: 'meta/llama-4-scout-17b-16e-instruct'
    num_workers: 16
  meta_llama-4-maverick-17b-128e-instruct:
    framework: 'nvdev'
    model: 'meta/llama-4-maverick-17b-128e-instruct'
    num_workers: 4
  openai_gpt-oss-20b:
    framework: 'nvdev'
    model: 'openai/gpt-oss-20b'
    num_workers: 1
  openai_gpt-oss-120b:
    framework: 'nvdev'
    model: 'openai/gpt-oss-120b'
    num_workers: 1
  # Entries using the `oneapi` framework. Unlike the entries above, each one
  # also carries a `deployment` name and an `api_version`, and sets
  # `is_closed: true`.
  #
  # `api_version` MUST stay quoted: the current values are only read as strings
  # because of their `-preview` suffix. A date-only value (e.g. 2024-10-21)
  # written without quotes would be loaded as a date object by YAML 1.1
  # parsers instead of a string.
  gpt-4o:
    framework: 'oneapi'
    model: 'gpt-4o'
    deployment: 'gpt-4o-20241120'
    api_version: '2024-12-01-preview'
    num_workers: 2
    is_closed: true
  gpt-4o-mini:
    framework: 'oneapi'
    model: 'gpt-4o-mini'
    deployment: 'gpt-4o-mini-20240718'
    api_version: '2024-12-01-preview'
    num_workers: 2
    is_closed: true
  gpt-4:
    framework: 'oneapi'
    model: 'gpt-4'
    deployment: 'gpt-4'
    api_version: '2024-12-01-preview'
    num_workers: 1
    is_closed: true
  gpt-4.1:
    framework: 'oneapi'
    model: 'gpt-4.1'
    deployment: 'gpt-4.1-20250414'
    api_version: '2024-12-01-preview'
    num_workers: 2
    is_closed: true
  gpt-4.1-mini:
    framework: 'oneapi'
    model: 'gpt-4.1-mini'
    deployment: 'gpt-4.1-mini-20250414'
    api_version: '2024-12-01-preview'
    num_workers: 2
    is_closed: true
  gpt-4.5:
    framework: 'oneapi'
    model: 'gpt-4.5'
    deployment: 'gpt-4.5-preview-20250227'
    api_version: '2024-12-01-preview'
    num_workers: 2
    is_closed: true
  # The two entries below use a newer `api_version` than the ones above.
  gpt-5-chat:
    framework: 'oneapi'
    model: 'gpt-5-chat'
    deployment: 'gpt-5-chat-20250807'
    api_version: '2025-04-01-preview'
    num_workers: 1
    is_closed: true
  claude-sonnet-4:
    framework: 'oneapi'
    model: 'claude-sonnet-4'
    deployment: 'claude-sonnet-4-20250514'
    api_version: '2025-04-01-preview'
    num_workers: 2
    is_closed: true
