# Judge Configuration File for LiteLLM Framework
# This file defines Judge's Verdict models using the LiteLLM framework.
# LiteLLM provides a unified interface for multiple LLM providers.
# IMPORTANT: Model identifiers (keys) must exactly match the folder names in results/

# Default values applied to all models unless overridden.
# A model entry under `models:` repeats a key only to replace the value set
# here; every model entry visible in this file sets its own `num_workers`.
defaults:
  # presumably 0.0 is chosen for repeatable judge output — TODO confirm
  temperature: 0.0
  # NOTE(review): very small completion budget; presumably the judge is
  # expected to answer with a short verdict only — confirm with the consumer.
  max_tokens: 8
  # Fallback used only by a model entry that does not set `num_workers`.
  num_workers: 16
  # presumably seconds per request — TODO confirm against the loader
  timeout: 60
  # presumably retry attempts per failed request — TODO confirm
  max_retries: 3

# Model configurations using the LiteLLM framework
# Key names MUST match the folder names in results/
models:
  # OpenAI models (LiteLLM `openai/` provider prefix).
  # Each key is the model id with the `openai/` prefix removed; each entry
  # replaces the default `num_workers` with its own value.
  gpt-4o:
    framework: litellm
    model: openai/gpt-4o
    num_workers: 2

  gpt-4o-mini:
    framework: litellm
    model: openai/gpt-4o-mini
    num_workers: 2

  gpt-4:
    framework: litellm
    model: openai/gpt-4
    num_workers: 1

  gpt-4.1:
    framework: litellm
    model: openai/gpt-4.1
    num_workers: 2

  gpt-4.1-mini:
    framework: litellm
    model: openai/gpt-4.1-mini
    num_workers: 2

  # NOTE(review): OpenAI's public API appears to expose this model as
  # `gpt-4.5-preview` — confirm that the id below resolves at the provider.
  gpt-4.5:
    framework: litellm
    model: openai/gpt-4.5
    num_workers: 2

  # NOTE(review): OpenAI's public API appears to expose this model as
  # `gpt-5-chat-latest` — confirm that the id below resolves at the provider.
  gpt-5-chat:
    framework: litellm
    model: openai/gpt-5-chat
    num_workers: 1
    
  # Anthropic Claude model (LiteLLM `anthropic/` provider prefix).
  # The key drops the `-20250514` suffix that the model id carries.
  claude-sonnet-4:
    framework: litellm
    model: anthropic/claude-sonnet-4-20250514
    num_workers: 2
    
  # Meta Llama models (via NVIDIA NIM).
  # Keys follow `<org>_<model>`, mirroring the `nvidia_nim/<org>/<model>` id
  # with the provider prefix removed and `/` replaced by `_`.
  meta_llama-3.1-70b-instruct:
    framework: litellm
    model: nvidia_nim/meta/llama-3.1-70b-instruct
    num_workers: 4

  meta_llama-3.2-3b-instruct:
    framework: litellm
    model: nvidia_nim/meta/llama-3.2-3b-instruct
    num_workers: 24

  meta_llama-3.2-1b-instruct:
    framework: litellm
    model: nvidia_nim/meta/llama-3.2-1b-instruct
    num_workers: 32

  meta_llama-3.1-8b-instruct:
    framework: litellm
    model: nvidia_nim/meta/llama-3.1-8b-instruct
    num_workers: 24

  meta_llama-3.1-405b-instruct:
    framework: litellm
    model: nvidia_nim/meta/llama-3.1-405b-instruct
    num_workers: 2
    
  # Llama 4 models (experimental/preview), addressed through the
  # `nvidia_nim/meta/` id prefix.
  meta_llama-4-scout-17b-16e-instruct:
    framework: litellm
    model: nvidia_nim/meta/llama-4-scout-17b-16e-instruct
    num_workers: 16

  meta_llama-4-maverick-17b-128e-instruct:
    framework: litellm
    model: nvidia_nim/meta/llama-4-maverick-17b-128e-instruct
    num_workers: 4
    
  # NVIDIA Nemotron models, addressed through the `nvidia_nim/nvidia/` id
  # prefix. Keys are the model id with that provider prefix removed and the
  # remaining `/` replaced by `_`.
  nvidia_llama-3.1-nemotron-70b-instruct:
    framework: litellm
    model: nvidia_nim/nvidia/llama-3.1-nemotron-70b-instruct
    num_workers: 4

  nvidia_llama-3.1-nemotron-ultra-253b-v1:
    framework: litellm
    model: nvidia_nim/nvidia/llama-3.1-nemotron-ultra-253b-v1
    num_workers: 4

  nvidia_llama-3.3-nemotron-super-49b-v1:
    framework: litellm
    model: nvidia_nim/nvidia/llama-3.3-nemotron-super-49b-v1
    num_workers: 8

  nvidia_llama-3.1-nemotron-nano-8b-v1:
    framework: litellm
    model: nvidia_nim/nvidia/llama-3.1-nemotron-nano-8b-v1
    num_workers: 1

  nvidia_nemotron-mini-4b-instruct:
    framework: litellm
    model: nvidia_nim/nvidia/nemotron-mini-4b-instruct
    num_workers: 8
    
  # Mistral models (via NVIDIA NIM).
  # The two entries sit under different org segments in the model id
  # (`mistralai` and `nv-mistralai`); each key mirrors its own segment.
  mistralai_mixtral-8x22b-instruct-v0.1:
    framework: litellm
    model: nvidia_nim/mistralai/mixtral-8x22b-instruct-v0.1
    num_workers: 8

  nv-mistralai_mistral-nemo-12b-instruct:
    framework: litellm
    model: nvidia_nim/nv-mistralai/mistral-nemo-12b-instruct
    num_workers: 16
    
  # Google Gemma models (via NVIDIA NIM, `nvidia_nim/google/` id prefix).
  google_gemma-2-2b-it:
    framework: litellm
    model: nvidia_nim/google/gemma-2-2b-it
    num_workers: 32

  google_gemma-3-27b-it:
    framework: litellm
    model: nvidia_nim/google/gemma-3-27b-it
    num_workers: 8
    
  # OpenAI OSS models (may require custom endpoint or local deployment).
  # As configured here, both ids use the `nvidia_nim/openai/` prefix rather
  # than the `openai/` prefix.
  openai_gpt-oss-20b:
    framework: litellm
    model: nvidia_nim/openai/gpt-oss-20b
    num_workers: 1

  openai_gpt-oss-120b:
    framework: litellm
    model: nvidia_nim/openai/gpt-oss-120b
    num_workers: 1