# open-webui/litellm-config.yaml
# 2025-02-26 14:22:58 +01:00
#
# 72 lines
# 2.2 KiB
# YAML

# Library-level LiteLLM settings. The options must be nested under this key;
# at column 0 they would be parsed as unrelated top-level keys and
# `litellm_settings` itself would be null.
# NOTE(review): `debug`, `verbose` and `load_env_variables` are kept exactly as
# written; confirm against the LiteLLM docs that each is a recognised setting
# (the documented verbose-logging switch appears to be `set_verbose`).
litellm_settings:
  debug: true
  verbose: true
  load_env_variables: true
# Models exposed by the proxy. Each entry has:
#   model_name     - public alias that clients request
#   litellm_params - provider model id plus the parameters used to call it
#   model_info     - descriptive metadata about the model
model_list:
# Azure OpenAI GPT-4o deployment.
- model_name: 'GPT 4o'
  litellm_params:
    model: 'azure/gpt-4o'
    # `os.environ/<NAME>` makes LiteLLM read the value from the environment,
    # so the endpoint and key are never stored in this file.
    api_base: os.environ/AZURE_OPENAI_API_BASE_URL
    api_key: os.environ/AZURE_OPENAI_API_KEY
    max_tokens: 800
  model_info:
    description: "OpenAI's most advanced model, ideal for complex tasks."
    arena_elo: 1287
    knowledge_cutoff: 'October 2023'
    context_window: 128000
# Azure OpenAI GPT-3.5 Turbo deployment; endpoint and key are read from the
# environment through the `os.environ/<NAME>` references.
- model_name: 'GPT 3.5 Turbo'
  litellm_params:
    model: 'azure/gpt-35-turbo'
    api_base: os.environ/AZURE_OPENAI_API_BASE_URL
    api_key: os.environ/AZURE_OPENAI_API_KEY
    max_tokens: 800
  model_info:
    description: "OpenAI's cheaper model for less complex tasks."
    arena_elo: 1116
    knowledge_cutoff: 'September 2021'
    context_window: 16000
# Claude 3 Haiku served through Vertex AI (project and region set below).
- model_name: 'Claude 3 Haiku'
  litellm_params:
    model: 'vertex_ai/claude-3-haiku@20240307'
    vertex_project: 'testllm-94944'
    vertex_location: 'europe-west4'
  model_info:
    description: 'Lightning-fast responses for simple queries.'
    arena_elo: 1178
    knowledge_cutoff: 'August 2023'
    # Written without `_` separators: `200_000` is an integer only under
    # YAML 1.1 and is read as a string by YAML 1.2 core-schema parsers.
    context_window: 200000
# Claude 3.5 Sonnet served through Vertex AI (project and region set below).
- model_name: 'Claude 3.5 Sonnet'
  litellm_params:
    model: 'vertex_ai/claude-3-5-sonnet@20240620'
    vertex_project: 'testllm-94944'
    vertex_location: 'europe-west1'
  model_info:
    description: "Anthropic's latest model."
    arena_elo: 1271
    knowledge_cutoff: 'August 2023'
    # Written without `_` separators: `200_000` is an integer only under
    # YAML 1.1 and is read as a string by YAML 1.2 core-schema parsers.
    context_window: 200000
# Gemini 1.5 Pro, configured with a Vertex AI project and region.
- model_name: 'Gemini 1.5 Pro'
  litellm_params:
    # NOTE(review): unlike the Claude entries, this id has no `vertex_ai/`
    # provider prefix. Left unchanged here; confirm LiteLLM resolves it to
    # Vertex AI, or switch to `vertex_ai/gemini-1.5-pro`.
    model: 'gemini-1.5-pro'
    vertex_project: 'testllm-94944'
    vertex_location: 'europe-west3'
  model_info:
    description: "Google's leading model with a very large context window."
    arena_elo: 1265
    knowledge_cutoff: 'November 2023'
    # Written without `_` separators: `2_000_000` is an integer only under
    # YAML 1.1 and is read as a string by YAML 1.2 core-schema parsers.
    context_window: 2000000
# Gemini 1.5 Flash, configured with a Vertex AI project and region.
- model_name: 'Gemini 1.5 Flash'
  litellm_params:
    # NOTE(review): unlike the Claude entries, this id has no `vertex_ai/`
    # provider prefix. Left unchanged here; confirm LiteLLM resolves it to
    # Vertex AI, or switch to `vertex_ai/gemini-1.5-flash-001`.
    model: 'gemini-1.5-flash-001'
    vertex_project: 'testllm-94944'
    vertex_location: 'europe-west3'
  model_info:
    description: 'Optimized for speed and efficiency.'
    arena_elo: 1231
    knowledge_cutoff: 'November 2023'
    # Written without `_` separators: `1_000_000` is an integer only under
    # YAML 1.1 and is read as a string by YAML 1.2 core-schema parsers.
    context_window: 1000000
# Proxy-wide general settings. Kept as an explicit empty mapping (`{}`), so the
# key parses as a mapping rather than null; no settings are overridden here.
general_settings: {}