# ai-servers/litellm/config.yaml
#
# Viewer metadata captured with this copy: 90 lines, 2.5 KiB, YAML.

# Models exposed by the proxy. Each entry maps a client-facing alias
# (`model_name`) to an upstream route and credentials (`litellm_params`).
# API keys are `os.environ/<NAME>` references, so no secret is stored here.
model_list:
# --- OpenRouter models ---
- model_name: kimi-k2.5
  litellm_params:
    model: openrouter/moonshotai/kimi-k2.5
    api_key: os.environ/OPENROUTER_API_KEY
- model_name: devstral
  litellm_params:
    model: openrouter/mistralai/devstral-small
    api_key: os.environ/OPENROUTER_API_KEY
# NOTE(review): the alias says "m2" but the route below is minimax-m1;
# confirm which model is intended.
- model_name: minimax-m2
  litellm_params:
    model: openrouter/minimax/minimax-m1
    api_key: os.environ/OPENROUTER_API_KEY
# NOTE(review): the alias says "gpt-oss" but the route below is
# openai/gpt-4.1-mini; confirm which model is intended.
- model_name: gpt-oss
  litellm_params:
    model: openrouter/openai/gpt-4.1-mini
    api_key: os.environ/OPENROUTER_API_KEY
# --- OpenRouter models (writing) ---
# All four aliases share the OPENROUTER_API_KEY credential.
# NOTE(review): the alias omits "preview" while the route targets
# gemini-2.5-pro-preview; confirm the upstream id is still current.
- model_name: gemini-2.5-pro
  litellm_params:
    model: openrouter/google/gemini-2.5-pro-preview
    api_key: os.environ/OPENROUTER_API_KEY
- model_name: claude-sonnet
  litellm_params:
    model: openrouter/anthropic/claude-sonnet-4
    api_key: os.environ/OPENROUTER_API_KEY
- model_name: gpt-4.1
  litellm_params:
    model: openrouter/openai/gpt-4.1
    api_key: os.environ/OPENROUTER_API_KEY
# The route carries a ":free" suffix; the colon is not followed by a space,
# so the value is still a valid plain YAML scalar.
- model_name: deepseek-v3
  litellm_params:
    model: openrouter/deepseek/deepseek-chat-v3-0324:free
    api_key: os.environ/OPENROUTER_API_KEY
# --- SiliconFlow models ---
# These entries use the `openai/` route prefix together with an explicit
# `api_base`, i.e. SiliconFlow is addressed as an OpenAI-compatible endpoint.
# NOTE(review): the alias says "glm-4.7" but the route below is
# THUDM/GLM-4-32B-0414; confirm which model is intended.
- model_name: glm-4.7
  litellm_params:
    model: openai/THUDM/GLM-4-32B-0414
    api_base: https://api.siliconflow.cn/v1
    api_key: os.environ/SILICONFLOW_API_KEY
- model_name: qwen3-coder
  litellm_params:
    model: openai/Qwen/Qwen3-Coder
    api_base: https://api.siliconflow.cn/v1
    api_key: os.environ/SILICONFLOW_API_KEY
# --- DeepInfra models ---
# All three aliases share the DEEPINFRA_API_KEY credential.
# NOTE(review): the alias says "v3.2" but the route below is
# DeepSeek-V3-0324; confirm which model is intended.
- model_name: deepseek-v3.2
  litellm_params:
    model: deepinfra/deepseek-ai/DeepSeek-V3-0324
    api_key: os.environ/DEEPINFRA_API_KEY
# Suffixed "-deepinfra" to keep it distinct from the OpenRouter-routed
# `devstral` alias.
- model_name: devstral-deepinfra
  litellm_params:
    model: deepinfra/mistralai/Devstral-Small-2505
    api_key: os.environ/DEEPINFRA_API_KEY
- model_name: deepseek-r1
  litellm_params:
    model: deepinfra/deepseek-ai/DeepSeek-R1
    api_key: os.environ/DEEPINFRA_API_KEY
# --- Groq (free/fast) ---
# Single Llama 3.3 70B route, authenticated with GROQ_API_KEY.
- model_name: llama-3.3-70b
  litellm_params:
    model: groq/llama-3.3-70b-versatile
    api_key: os.environ/GROQ_API_KEY
# --- Cerebras (free/fast) ---
# Suffixed "-cerebras" to keep it distinct from the Groq-routed
# `llama-3.3-70b` alias.
- model_name: llama-3.3-70b-cerebras
  litellm_params:
    model: cerebras/llama-3.3-70b
    api_key: os.environ/CEREBRAS_API_KEY
# Proxy-wide settings.
general_settings:
  # Master key for the proxy, referenced from the LITELLM_MASTER_KEY
  # environment variable rather than stored in this file.
  master_key: os.environ/LITELLM_MASTER_KEY
# Settings passed to the LiteLLM library.
litellm_settings:
  # Per the LiteLLM docs: drop request parameters a provider does not
  # support instead of failing the call.
  drop_params: true
  # Verbose debug output stays disabled.
  set_verbose: false