# This file defines all models supported by the UnifiedLLMClient class.
# Each model specifies its available providers and the provider-specific model IDs.

# Quick AWS note: some models cannot be invoked with their bare model ID; they
# must be called through an "inference profile" (e.g. Claude Haiku 4.5). Such
# models typically have very low quota limits (e.g. 2 requests per minute).

# Important: Be cautious when adding older models. Some can be very expensive.

# Registry of supported models. Each list entry is a mapping with two keys:
#   name:      the model name used to look the entry up in this file
#   providers: mapping of provider key -> provider-specific model ID
#
# Formatting rules for this table:
#   - One entry per line, flow style, one space inside braces and after commas.
#   - Any model ID containing ':' (all AWS IDs below) is single-quoted so that
#     every YAML parser reads it as a single string inside the flow mapping.
#   - Entry order is kept as-is; do not sort without checking the consumer.
supported_models:

  # Local model (no need for specific model name)
  - { name: local, providers: { sglang: local, local: local } }

  # GPT (OpenAI API; the open-weight gpt-oss models are served through AWS)
  - { name: gpt-5.1, providers: { openai: gpt-5.1 } }
  - { name: gpt-5.1-2025-11-13, providers: { openai: gpt-5.1-2025-11-13 } }
  - { name: gpt-5, providers: { openai: gpt-5 } }
  - { name: gpt-5-2025-08-07, providers: { openai: gpt-5-2025-08-07 } }
  - { name: gpt-5-mini, providers: { openai: gpt-5-mini } }
  - { name: gpt-5-mini-2025-08-07, providers: { openai: gpt-5-mini-2025-08-07 } }
  - { name: gpt-5-nano, providers: { openai: gpt-5-nano } }
  - { name: gpt-5.2-2025-12-11, providers: { openai: gpt-5.2-2025-12-11 } }
  - { name: gpt-4.1, providers: { openai: gpt-4.1 } }
  - { name: gpt-4.1-mini, providers: { openai: gpt-4.1-mini } }
  - { name: gpt-4.1-mini-2025-04-14, providers: { openai: gpt-4.1-mini-2025-04-14 } }
  - { name: gpt-4.1-nano, providers: { openai: gpt-4.1-nano } }
  - { name: gpt-4o, providers: { openai: gpt-4o } }
  - { name: gpt-4o-2024-11-20, providers: { openai: gpt-4o-2024-11-20 } }
  - { name: gpt-4o-mini, providers: { openai: gpt-4o-mini } }
  - { name: gpt-oss-20b, providers: { aws: 'openai.gpt-oss-20b-1:0' } }
  - { name: gpt-oss-120b, providers: { aws: 'openai.gpt-oss-120b-1:0' } }

  # Gemini (Google)
  - { name: gemini-3-flash-preview, providers: { gemini: gemini-3-flash-preview } }
  - { name: gemini-2.5-flash-preview-09-2025, providers: { gemini: gemini-2.5-flash-preview-09-2025 } }

  # Qwen
  - { name: qwen3-235b-a22b, providers: { aws: 'qwen.qwen3-235b-a22b-2507-v1:0' } }
  - { name: qwen3-32b, providers: { aws: 'qwen.qwen3-32b-v1:0' } }

  # DeepSeek
  # NOTE(review): the AWS ID reads "v3" while the model name is v3.1 - this
  # appears to be the ID AWS assigns to V3.1; confirm before changing either.
  - { name: deepseek-v3.1, providers: { aws: 'deepseek.v3-v1:0' } }

  # Claude
  # NOTE(review): IDs starting with "us." look like AWS inference-profile IDs
  # rather than bare model IDs - confirm against the AWS console when adding
  # or changing an entry.
  - { name: claude-haiku-4.5, providers: { aws: 'us.anthropic.claude-haiku-4-5-20251001-v1:0' } }
  - { name: claude-3.5-haiku, providers: { aws: 'anthropic.claude-3-5-haiku-20241022-v1:0' } }
  - { name: claude-3-haiku, providers: { aws: 'anthropic.claude-3-haiku-20240307-v1:0' } }

  # Llama
  - { name: llama-4-maverick-17b, providers: { aws: 'us.meta.llama4-maverick-17b-instruct-v1:0' } }
  - { name: llama-4-scout-17b, providers: { aws: 'us.meta.llama4-scout-17b-instruct-v1:0' } }
  - { name: llama-3.3-instruct-70b, providers: { aws: 'us.meta.llama3-3-70b-instruct-v1:0' } }
  - { name: llama-3.2-instruct-90b, providers: { aws: 'us.meta.llama3-2-90b-instruct-v1:0' } }
  - { name: llama-3.2-instruct-11b, providers: { aws: 'us.meta.llama3-2-11b-instruct-v1:0' } }
  - { name: llama-3.2-instruct-3b, providers: { aws: 'us.meta.llama3-2-3b-instruct-v1:0' } }
  - { name: llama-3.2-instruct-1b, providers: { aws: 'us.meta.llama3-2-1b-instruct-v1:0' } }
  - { name: llama-3.1-instruct-70b, providers: { aws: 'meta.llama3-1-70b-instruct-v1:0' } }
  - { name: llama-3.1-instruct-8b, providers: { aws: 'meta.llama3-1-8b-instruct-v1:0' } }
