fix: update pricing and routes for gemma, qwen, and pixtral models

This commit is contained in:
Ray Andrew 2026-02-18 02:43:31 -06:00
parent 05d71ba07c
commit f63d2d0956
Signed by: rayandrew
SSH key fingerprint: SHA256:EUCV+qCSqkap8rR+p+zGjxHfKI06G0GJKgo1DIOniQY

View file

@@ -384,7 +384,7 @@ models:
pricing: { input: 0.017, output: 0.068 } pricing: { input: 0.017, output: 0.068 }
- provider: deepinfra - provider: deepinfra
model: "google/gemma-3-4b-it" model: "google/gemma-3-4b-it"
pricing: { input: 0.04, output: 0.08 } pricing: { input: 0.02, output: 0.04 }
- name: "gemma-3-12b" - name: "gemma-3-12b"
routes: routes:
@@ -392,7 +392,7 @@ models:
model: "gemma3:12b-cloud" model: "gemma3:12b-cloud"
- provider: openrouter - provider: openrouter
model: "google/gemma-3-12b-it" model: "google/gemma-3-12b-it"
pricing: { input: 0.03, output: 0.10 } pricing: { input: 0.04, output: 0.13 }
- provider: deepinfra - provider: deepinfra
model: "google/gemma-3-12b-it" model: "google/gemma-3-12b-it"
pricing: { input: 0.04, output: 0.13 } pricing: { input: 0.04, output: 0.13 }
@@ -426,20 +426,25 @@ models:
routes: routes:
- provider: ollama-cloud - provider: ollama-cloud
model: "qwen3-vl:32b-cloud" model: "qwen3-vl:32b-cloud"
- provider: openrouter
model: "qwen/qwen3-vl-32b-instruct"
pricing: { input: 0.104, output: 0.416 }
- provider: siliconflow - provider: siliconflow
model: "Qwen/Qwen3-VL-32B-Instruct" model: "Qwen/Qwen3-VL-32B-Instruct"
pricing: { input: 0.20, output: 0.60 } pricing: { input: 0.20, output: 0.60 }
- name: "qwen2.5-vl-7b"
routes:
- provider: ollama-cloud
model: "qwen2.5vl:7b-cloud"
- provider: openrouter
model: "qwen/qwen-2.5-vl-7b-instruct"
pricing: { input: 0.20, output: 0.20 }
- name: "qwen2.5-vl-32b" - name: "qwen2.5-vl-32b"
routes: routes:
- provider: ollama-cloud - provider: ollama-cloud
model: "qwen2.5vl:32b-cloud" model: "qwen2.5vl:32b-cloud"
- provider: openrouter - provider: openrouter
model: "qwen/qwen2.5-vl-32b-instruct" model: "qwen/qwen2.5-vl-32b-instruct"
pricing: { input: 0.05, output: 0.22 } pricing: { input: 0.20, output: 0.60 }
- provider: deepinfra - provider: deepinfra
model: "Qwen/Qwen2.5-VL-32B-Instruct" model: "Qwen/Qwen2.5-VL-32B-Instruct"
pricing: { input: 0.20, output: 0.60 } pricing: { input: 0.20, output: 0.60 }
@@ -458,31 +463,16 @@ models:
- name: "pixtral-12b" - name: "pixtral-12b"
routes: routes:
- provider: deepinfra
model: "mistralai/Pixtral-12B-2409"
pricing: { input: 0.15, output: 0.15 }
- provider: openrouter - provider: openrouter
model: "mistralai/pixtral-12b" model: "mistralai/pixtral-12b"
pricing: { input: 0.125, output: 0.125 } pricing: { input: 0.15, output: 0.15 }
- name: "kimi-vl-a3b-thinking" - name: "gemini-2.5-flash-lite"
routes: routes:
- provider: openrouter - provider: openrouter
model: "moonshotai/kimi-vl-a3b-thinking" model: "google/gemini-2.5-flash-lite"
pricing: { input: 0.025, output: 0.10 }
- name: "gemini-2.0-flash"
routes:
- provider: openrouter
model: "google/gemini-2.0-flash-001"
pricing: { input: 0.10, output: 0.40 } pricing: { input: 0.10, output: 0.40 }
- name: "gemini-2.0-flash-lite"
routes:
- provider: openrouter
model: "google/gemini-2.0-flash-lite-001"
pricing: { input: 0.075, output: 0.30 }
- name: "claude-sonnet" - name: "claude-sonnet"
routes: routes:
- provider: openrouter - provider: openrouter