refactor(gateway): reorder and restructure llama-3.3-70b model routes in configuration

This commit is contained in:
Ray Andrew 2026-02-16 13:09:51 -06:00
parent c949498a7d
commit c60f14e002
Signed by: rayandrew
SSH key fingerprint: SHA256:EUCV+qCSqkap8rR+p+zGjxHfKI06G0GJKgo1DIOniQY

View file

@ -117,18 +117,6 @@ models:
# model: "stepfun/step-3.5-flash:free"
# ═══ TIER 2: Low cost (Groq, Cerebras — free tier with rate limits) ═══
# Gateway model entry: the public name "llama-3.3-70b" mapped onto three
# provider routes. Each route names the provider, the provider-side model
# identifier, and an input/output price pair.
# NOTE(review): pricing units are not stated in this file — confirm against
# the gateway's config schema.
# NOTE(review): routes here are NOT in price order; deepinfra (second) has
# the lowest listed input and output price. Whether list order drives
# routing priority is not visible here — confirm.
- name: "llama-3.3-70b"
  routes:
    - provider: groq
      model: "llama-3.3-70b-versatile"
      pricing:
        input: 0.59
        output: 0.79
    - provider: deepinfra
      model: "meta-llama/Llama-3.3-70B-Instruct-Turbo"
      pricing:
        input: 0.23
        output: 0.40
    - provider: cerebras
      model: "llama-3.3-70b"
      pricing:
        input: 0.85
        output: 1.20
- name: "llama-3.1-8b"
routes:
- provider: groq
@ -141,6 +129,18 @@ models:
model: "meta-llama/Meta-Llama-3.1-8B-Instruct"
pricing: { input: 0.03, output: 0.05 }
# Gateway model entry: the public name "llama-3.3-70b" mapped onto three
# provider routes. Each route names the provider, the provider-side model
# identifier, and an input/output price pair.
# Routes are listed in ascending order of both input and output price
# (deepinfra, then groq, then cerebras).
# NOTE(review): presumably list order is the gateway's route preference —
# confirm against the router implementation. Pricing units are not stated
# in this file.
- name: "llama-3.3-70b"
  routes:
    - provider: deepinfra
      model: "meta-llama/Llama-3.3-70B-Instruct-Turbo"
      pricing:
        input: 0.23
        output: 0.40
    - provider: groq
      model: "llama-3.3-70b-versatile"
      pricing:
        input: 0.59
        output: 0.79
    - provider: cerebras
      model: "llama-3.3-70b"
      pricing:
        input: 0.85
        output: 1.20
- name: "gpt-oss"
routes:
- provider: groq