model_list:
  # GPT-4 group. Every entry in this group uses model_name "gpt-4" and points
  # at a different Azure OpenAI endpoint with its own rpm/tpm limits.
  #
  # Sweden Central endpoints, deployment "gpt-4-0409" (gpt-4-turbo-2024-04-09).
  - model_name: gpt-4
    litellm_params:
      model: 'azure/gpt-4-0409'
      api_base: 'https://3-openai-swedencentral.openai.azure.com/'
      api_version: '2024-02-15-preview'
      rpm: 900
      tpm: 150000
  - model_name: gpt-4
    litellm_params:
      model: 'azure/gpt-4-0409'
      api_base: 'https://4-openai-swedencentral.openai.azure.com/'
      api_version: '2024-02-15-preview'
      rpm: 900
      tpm: 150000
  - model_name: gpt-4
    litellm_params:
      model: 'azure/gpt-4-0409'
      api_base: 'https://5-openai-swedencentral.openai.azure.com/'
      api_version: '2024-02-15-preview'
      rpm: 900
      tpm: 150000
  # Deployment "gpt-4-1106" endpoints, configured with lower limits.
  # NOTE(review): presumably a 1106 build rather than 2024-04-09 - confirm.
  - model_name: gpt-4
    litellm_params:
      model: 'azure/gpt-4-1106'
      api_base: 'https://3-openai-australiaeast.openai.azure.com/'
      api_version: '2024-02-15-preview'
      rpm: 480
      tpm: 80000
  - model_name: gpt-4
    litellm_params:
      model: 'azure/gpt-4-1106'
      api_base: 'https://3-openai-canadaeast.openai.azure.com/'
      api_version: '2024-02-15-preview'
      rpm: 480
      tpm: 80000
  # gpt-4 deployment "gpt-4-1106" on the 3-openai-francecentral Azure endpoint.
  # The AWS-only key aws_region_name (previously "sweden-central") was dropped:
  # this is an Azure deployment and the value matched neither an AWS region
  # nor this endpoint's region.
  # NOTE(review): rpm/tpm here (900 / 150000) differ from the other
  # gpt-4-1106 deployments (480 / 80000) - confirm against the real quota.
  - model_name: gpt-4
    litellm_params:
      model: azure/gpt-4-1106
      api_base: https://3-openai-francecentral.openai.azure.com/
      api_version: 2024-02-15-preview
      rpm: 900
      tpm: 150000
      # Plain decimals on purpose: YAML 1.1 loaders such as PyYAML read
      # dot-less exponent forms like 1e-5 as strings, not floats.
      input_cost_per_token: 0.00001
      output_cost_per_token: 0.00003
  # More gpt-4 deployments named "gpt-4-1106", one per Azure endpoint, all
  # configured with 480 rpm / 80000 tpm.
  # NOTE(review): no 4-openai-francecentral endpoint appears in this list -
  # confirm that is intentional.
  - model_name: gpt-4
    litellm_params:
      model: 'azure/gpt-4-1106'
      api_base: 'https://4-openai-australiaeast.openai.azure.com/'
      api_version: '2024-02-15-preview'
      rpm: 480
      tpm: 80000
  - model_name: gpt-4
    litellm_params:
      model: 'azure/gpt-4-1106'
      api_base: 'https://4-openai-canadaeast.openai.azure.com/'
      api_version: '2024-02-15-preview'
      rpm: 480
      tpm: 80000
  - model_name: gpt-4
    litellm_params:
      model: 'azure/gpt-4-1106'
      api_base: 'https://5-openai-australiaeast.openai.azure.com/'
      api_version: '2024-02-15-preview'
      rpm: 480
      tpm: 80000
  - model_name: gpt-4
    litellm_params:
      model: 'azure/gpt-4-1106'
      api_base: 'https://5-openai-canadaeast.openai.azure.com/'
      api_version: '2024-02-15-preview'
      rpm: 480
      tpm: 80000
  - model_name: gpt-4
    litellm_params:
      model: 'azure/gpt-4-1106'
      api_base: 'https://5-openai-francecentral.openai.azure.com/'
      api_version: '2024-02-15-preview'
      rpm: 480
      tpm: 80000
  # Claude Opus group (claude-3-opus-20240229): six entries, each limited to
  # 1000 rpm / 40000 tpm.
  # NOTE(review): the six entries are identical as written; presumably each
  # is meant to use a different credential supplied elsewhere - confirm.
  - model_name: claude-opus
    litellm_params:
      model: 'claude-3-opus-20240229'
      rpm: 1000
      tpm: 40000
  - model_name: claude-opus
    litellm_params:
      model: 'claude-3-opus-20240229'
      rpm: 1000
      tpm: 40000
  - model_name: claude-opus
    litellm_params:
      model: 'claude-3-opus-20240229'
      rpm: 1000
      tpm: 40000
  - model_name: claude-opus
    litellm_params:
      model: 'claude-3-opus-20240229'
      rpm: 1000
      tpm: 40000
  - model_name: claude-opus
    litellm_params:
      model: 'claude-3-opus-20240229'
      rpm: 1000
      tpm: 40000
  - model_name: claude-opus
    litellm_params:
      model: 'claude-3-opus-20240229'
      rpm: 1000
      tpm: 40000
  # Gemini 1.5 Pro group (gemini-1.5-pro-latest): six entries, each limited
  # to 360 rpm / 200000 tpm.
  # NOTE(review): the six entries are identical as written; presumably each
  # is meant to use a different credential supplied elsewhere - confirm.
  - model_name: gemini-1.5
    litellm_params:
      model: 'gemini/gemini-1.5-pro-latest'
      rpm: 360
      tpm: 200000
  - model_name: gemini-1.5
    litellm_params:
      model: 'gemini/gemini-1.5-pro-latest'
      rpm: 360
      tpm: 200000
  - model_name: gemini-1.5
    litellm_params:
      model: 'gemini/gemini-1.5-pro-latest'
      rpm: 360
      tpm: 200000
  - model_name: gemini-1.5
    litellm_params:
      model: 'gemini/gemini-1.5-pro-latest'
      rpm: 360
      tpm: 200000
  - model_name: gemini-1.5
    litellm_params:
      model: 'gemini/gemini-1.5-pro-latest'
      rpm: 360
      tpm: 200000
  - model_name: gemini-1.5
    litellm_params:
      model: 'gemini/gemini-1.5-pro-latest'
      rpm: 360
      tpm: 200000
  # Llama3 70B group (llama3:70b-instruct-q5_K_M): two ollama_chat endpoints.
  # No rpm/tpm limits are declared for these entries.
  - model_name: llama3-70b
    litellm_params:
      model: 'ollama_chat/llama3:70b-instruct-q5_K_M'
      api_base: 'https://17hk1lm3hg6nqf-11434.proxy.runpod.net'
  - model_name: llama3-70b
    litellm_params:
      model: 'ollama_chat/llama3:70b-instruct-q5_K_M'
      api_base: 'https://zkilvluvenmfov-11434.proxy.runpod.net'
  # Qwen 1.5 110B group (qwen:110b-chat-v1.5-q5_K_M): two ollama_chat
  # endpoints. No rpm/tpm limits are declared for these entries.
  - model_name: qwen-110b
    litellm_params:
      model: 'ollama_chat/qwen:110b-chat-v1.5-q5_K_M'
      api_base: 'https://87z18f2vkxspmg-11434.proxy.runpod.net'
  - model_name: qwen-110b
    litellm_params:
      model: 'ollama_chat/qwen:110b-chat-v1.5-q5_K_M'
      api_base: 'https://boe3b76kcsboic-11434.proxy.runpod.net'
  # Mixtral 8x22B group (mixtral:8x22b-instruct-v0.1-q5_K_M): two ollama_chat
  # endpoints. No rpm/tpm limits are declared for these entries.
  - model_name: mixtral-8x22b
    litellm_params:
      model: 'ollama_chat/mixtral:8x22b-instruct-v0.1-q5_K_M'
      api_base: 'https://dw37f85e3to8e2-11434.proxy.runpod.net'
  - model_name: mixtral-8x22b
    litellm_params:
      model: 'ollama_chat/mixtral:8x22b-instruct-v0.1-q5_K_M'
      api_base: 'https://uqolzw71uu9snm-11434.proxy.runpod.net'



router_settings:
  # Routing strategy, with the pre-call check switched on.
  routing_strategy: 'usage-based-routing-v2'
  enable_pre_call_check: true
  # Redis instance the router connects to.
  # NOTE(review): no redis_password is set here; presumably it is supplied
  # through the environment - confirm.
  redis_host: 'redis-14774.c281.us-east-1-2.ec2.redns.redis-cloud.com'
  redis_port: 14774
  # Retry count and timeout (presumably seconds - confirm).
  num_retries: 3
  timeout: 150

litellm_settings:
  # Library-level defaults. The retry count and the 150 timeout carry the
  # same values as num_retries / timeout under router_settings.
  request_timeout: 150
  num_retries: 3
  # Failure allowance (presumably per deployment before it is sidelined;
  # confirm against the LiteLLM docs).
  allowed_fails: 3


# Proxy-wide settings.
general_settings:
  # NOTE(review): presumably lets model definitions be persisted in the
  # proxy's database in addition to this file - confirm against LiteLLM docs.
  store_model_in_db: true


# environment_variables:
