Route additions for the "TIER 10: Vision / Multimodal" section of janus.yaml.

  * An ollama-cloud route is inserted as the first route of gemma-3-4b,
    gemma-3-12b, gemma-3-27b, qwen3-vl-8b, qwen3-vl-32b and qwen2.5-vl-32b.
    These routes carry no pricing key.
  * A siliconflow route is added to qwen3-vl-8b and qwen3-vl-32b.
  * New entries: llama-3.2-11b-vision, pixtral-12b, kimi-vl-a3b-thinking,
    gemini-2.0-flash, gemini-2.0-flash-lite.
  * llama-3.2-11b-vision deliberately has no groq route (see the comment in
    the last hunk).

NOTE(review): leading whitespace inside the hunks was reconstructed with
2-space YAML nesting; confirm it matches the target file before applying.

diff --git a/janus.yaml b/janus.yaml
index 738f99a..aa29d9e 100644
--- a/janus.yaml
+++ b/janus.yaml
@@ -377,6 +377,8 @@ models:
   # ═══ TIER 10: Vision / Multimodal ═══
   - name: "gemma-3-4b"
     routes:
+      - provider: ollama-cloud
+        model: "gemma3:4b-cloud"
       - provider: openrouter
         model: "google/gemma-3-4b-it"
         pricing: { input: 0.017, output: 0.068 }
@@ -386,6 +388,8 @@ models:
 
   - name: "gemma-3-12b"
     routes:
+      - provider: ollama-cloud
+        model: "gemma3:12b-cloud"
       - provider: openrouter
         model: "google/gemma-3-12b-it"
         pricing: { input: 0.03, output: 0.10 }
@@ -395,6 +399,8 @@ models:
 
   - name: "gemma-3-27b"
     routes:
+      - provider: ollama-cloud
+        model: "gemma3:27b-cloud"
       - provider: openrouter
         model: "google/gemma-3-27b-it"
         pricing: { input: 0.04, output: 0.15 }
@@ -404,21 +410,33 @@ models:
 
   - name: "qwen3-vl-8b"
     routes:
+      - provider: ollama-cloud
+        model: "qwen3-vl:8b-cloud"
       - provider: openrouter
         model: "qwen/qwen3-vl-8b-instruct"
         pricing: { input: 0.08, output: 0.50 }
+      - provider: siliconflow
+        model: "Qwen/Qwen3-VL-8B-Instruct"
+        pricing: { input: 0.08, output: 0.50 }
       - provider: deepinfra
         model: "Qwen/Qwen3-VL-8B-Instruct"
         pricing: { input: 0.18, output: 0.69 }
 
   - name: "qwen3-vl-32b"
     routes:
+      - provider: ollama-cloud
+        model: "qwen3-vl:32b-cloud"
       - provider: openrouter
         model: "qwen/qwen3-vl-32b-instruct"
         pricing: { input: 0.104, output: 0.416 }
+      - provider: siliconflow
+        model: "Qwen/Qwen3-VL-32B-Instruct"
+        pricing: { input: 0.20, output: 0.60 }
 
   - name: "qwen2.5-vl-32b"
     routes:
+      - provider: ollama-cloud
+        model: "qwen2.5vl:32b-cloud"
       - provider: openrouter
         model: "qwen/qwen2.5-vl-32b-instruct"
         pricing: { input: 0.05, output: 0.22 }
@@ -426,6 +444,43 @@ models:
         model: "Qwen/Qwen2.5-VL-32B-Instruct"
         pricing: { input: 0.20, output: 0.60 }
 
+  - name: "llama-3.2-11b-vision"
+    routes:
+      # No groq route: Groq has decommissioned "llama-3.2-11b-vision-preview".
+      - provider: deepinfra
+        model: "meta-llama/Llama-3.2-11B-Vision-Instruct"
+        pricing: { input: 0.049, output: 0.049 }
+      - provider: openrouter
+        model: "meta-llama/llama-3.2-11b-vision-instruct"
+        pricing: { input: 0.049, output: 0.049 }
+
+  - name: "pixtral-12b"
+    routes:
+      - provider: deepinfra
+        model: "mistralai/Pixtral-12B-2409"
+        pricing: { input: 0.15, output: 0.15 }
+      - provider: openrouter
+        model: "mistralai/pixtral-12b"
+        pricing: { input: 0.125, output: 0.125 }
+
+  - name: "kimi-vl-a3b-thinking"
+    routes:
+      - provider: openrouter
+        model: "moonshotai/kimi-vl-a3b-thinking"
+        pricing: { input: 0.025, output: 0.10 }
+
+  - name: "gemini-2.0-flash"
+    routes:
+      - provider: openrouter
+        model: "google/gemini-2.0-flash-001"
+        pricing: { input: 0.10, output: 0.40 }
+
+  - name: "gemini-2.0-flash-lite"
+    routes:
+      - provider: openrouter
+        model: "google/gemini-2.0-flash-lite-001"
+        pricing: { input: 0.075, output: 0.30 }
+
   - name: "claude-sonnet"
     routes:
       - provider: openrouter