From 3549abec3630a2876c03873cded637eabb92aada Mon Sep 17 00:00:00 2001 From: Luca Steeb Date: Fri, 23 Jan 2026 01:09:05 +0000 Subject: [PATCH 1/8] feat: add LLM Gateway provider with 153 models MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Add LLM Gateway (llmgateway.io) as a new provider with all supported models organized by upstream provider subdirectory. LLM Gateway is an OpenAI-compatible API gateway that provides unified access to 40+ LLM providers through a single API endpoint. Directory structure: providers/llmgateway/ ├── provider.toml ├── README.md ├── scripts/ │ └── generate.ts └── models/ ├── anthropic/ (16 models) ├── openai/ (28 models) ├── google/ (19 models) ├── zai/ (17 models - GLM, CogView) ├── alibaba/ (27 models - Qwen) ├── meta/ (12 models - Llama) ├── xai/ (9 models - Grok) ├── deepseek/ (5 models) ├── bytedance/ (6 models - Seed) ├── moonshot/ (4 models - Kimi) ├── mistral/ (3 models) ├── perplexity/ (3 models - Sonar) ├── minimax/ (1 model) ├── nvidia/ (1 model) └── llmgateway/ (2 models - auto, custom) Co-Authored-By: Claude Opus 4.5 --- providers/llmgateway/README.md | 68 +++++++++++++++++++ providers/llmgateway/logo.svg | 4 ++ .../llmgateway/models/alibaba/qwen-flash.toml | 22 ++++++ .../alibaba/qwen-image-max-2025-12-30.toml | 22 ++++++ .../models/alibaba/qwen-image-max.toml | 22 ++++++ .../models/alibaba/qwen-image-plus.toml | 22 ++++++ .../llmgateway/models/alibaba/qwen-image.toml | 22 ++++++ .../models/alibaba/qwen-max-latest.toml | 22 ++++++ .../llmgateway/models/alibaba/qwen-max.toml | 22 ++++++ .../models/alibaba/qwen-omni-turbo.toml | 22 ++++++ .../models/alibaba/qwen-plus-latest.toml | 22 ++++++ .../llmgateway/models/alibaba/qwen-plus.toml | 22 ++++++ .../llmgateway/models/alibaba/qwen-turbo.toml | 22 ++++++ .../models/alibaba/qwen-vl-max.toml | 22 ++++++ .../models/alibaba/qwen-vl-plus.toml | 22 ++++++ .../alibaba/qwen2-5-vl-72b-instruct.toml | 22 ++++++ 
.../models/alibaba/qwen25-coder-7b.toml | 22 ++++++ .../qwen3-235b-a22b-instruct-2507.toml | 23 +++++++ .../qwen3-235b-a22b-thinking-2507.toml | 23 +++++++ .../alibaba/qwen3-30b-a3b-instruct-2507.toml | 22 ++++++ .../alibaba/qwen3-30b-a3b-thinking-2507.toml | 22 ++++++ .../llmgateway/models/alibaba/qwen3-32b.toml | 22 ++++++ .../alibaba/qwen3-coder-30b-a3b-instruct.toml | 22 ++++++ .../qwen3-coder-480b-a35b-instruct.toml | 22 ++++++ .../models/alibaba/qwen3-coder-plus.toml | 22 ++++++ .../models/alibaba/qwen3-coder.toml | 22 ++++++ .../llmgateway/models/alibaba/qwen3-max.toml | 23 +++++++ .../alibaba/qwen3-next-80b-a3b-instruct.toml | 22 ++++++ .../alibaba/qwen3-next-80b-a3b-thinking.toml | 23 +++++++ .../anthropic/claude-3-5-haiku-20241022.toml | 24 +++++++ .../models/anthropic/claude-3-5-haiku.toml | 23 +++++++ .../anthropic/claude-3-5-sonnet-20240620.toml | 23 +++++++ .../models/anthropic/claude-3-5-sonnet.toml | 22 ++++++ .../anthropic/claude-3-7-sonnet-20250219.toml | 23 +++++++ .../models/anthropic/claude-3-7-sonnet.toml | 23 +++++++ .../models/anthropic/claude-3-haiku.toml | 23 +++++++ .../models/anthropic/claude-3-opus.toml | 23 +++++++ .../anthropic/claude-haiku-4-5-20251001.toml | 23 +++++++ .../models/anthropic/claude-haiku-4-5.toml | 23 +++++++ .../anthropic/claude-opus-4-1-20250805.toml | 23 +++++++ .../anthropic/claude-opus-4-20250514.toml | 22 ++++++ .../anthropic/claude-opus-4-5-20251101.toml | 23 +++++++ .../anthropic/claude-sonnet-4-20250514.toml | 22 ++++++ .../anthropic/claude-sonnet-4-5-20250929.toml | 23 +++++++ .../models/anthropic/claude-sonnet-4-5.toml | 23 +++++++ .../models/bytedance/seed-1-6-250615.toml | 22 ++++++ .../models/bytedance/seed-1-6-250915.toml | 22 ++++++ .../bytedance/seed-1-6-flash-250715.toml | 22 ++++++ .../models/bytedance/seed-1-8-251228.toml | 22 ++++++ .../models/bytedance/seedream-4-0.toml | 22 ++++++ .../models/bytedance/seedream-4-5.toml | 22 ++++++ .../models/deepseek/deepseek-r1-0528.toml | 22 ++++++ 
.../deepseek/deepseek-r1t2-chimera-free.toml | 21 ++++++ .../models/deepseek/deepseek-v3.1.toml | 23 +++++++ .../models/deepseek/deepseek-v3.2.toml | 22 ++++++ .../models/deepseek/deepseek-v3.toml | 21 ++++++ .../models/google/gemini-2.0-flash-lite.toml | 21 ++++++ .../models/google/gemini-2.0-flash.toml | 21 ++++++ .../gemini-2.5-flash-image-preview.toml | 22 ++++++ .../models/google/gemini-2.5-flash-image.toml | 22 ++++++ ...gemini-2.5-flash-lite-preview-09-2025.toml | 22 ++++++ .../models/google/gemini-2.5-flash-lite.toml | 22 ++++++ .../gemini-2.5-flash-preview-09-2025.toml | 22 ++++++ .../models/google/gemini-2.5-flash.toml | 22 ++++++ .../models/google/gemini-2.5-pro.toml | 21 ++++++ .../models/google/gemini-3-flash-preview.toml | 22 ++++++ .../google/gemini-3-pro-image-preview.toml | 22 ++++++ .../models/google/gemini-3-pro-preview.toml | 22 ++++++ .../google/gemma-2-27b-it-together.toml | 21 ++++++ .../models/google/gemma-3-12b-it.toml | 21 ++++++ .../models/google/gemma-3-1b-it.toml | 21 ++++++ .../llmgateway/models/google/gemma-3-27b.toml | 21 ++++++ .../models/google/gemma-3-4b-it.toml | 21 ++++++ .../models/google/gemma-3n-e2b-it.toml | 21 ++++++ .../models/google/gemma-3n-e4b-it.toml | 21 ++++++ .../llmgateway/models/llmgateway/auto.toml | 21 ++++++ .../llmgateway/models/llmgateway/custom.toml | 21 ++++++ .../models/meta/llama-3.1-70b-instruct.toml | 23 +++++++ .../models/meta/llama-3.1-8b-instruct.toml | 23 +++++++ .../meta/llama-3.1-nemotron-ultra-253b.toml | 21 ++++++ .../models/meta/llama-3.2-11b-instruct.toml | 22 ++++++ .../meta/llama-3.3-70b-instruct-free.toml | 21 ++++++ .../models/meta/llama-3.3-70b-instruct.toml | 21 ++++++ .../meta/llama-4-maverick-17b-instruct.toml | 23 +++++++ .../models/meta/llama-4-maverick-free.toml | 21 ++++++ .../meta/llama-4-scout-17b-instruct.toml | 23 +++++++ .../models/meta/llama-4-scout-free.toml | 21 ++++++ .../llmgateway/models/meta/llama-4-scout.toml | 22 ++++++ .../models/meta/llama-guard-4-12b.toml | 21 
++++++ .../models/minimax/minimax-m2.1.toml | 23 +++++++ .../models/mistral/mistral-large-latest.toml | 21 ++++++ .../mixtral-8x7b-instruct-together.toml | 21 ++++++ .../models/mistral/pixtral-large-latest.toml | 21 ++++++ .../models/moonshot/kimi-k2-0905-free.toml | 21 ++++++ .../moonshot/kimi-k2-thinking-turbo.toml | 23 +++++++ .../models/moonshot/kimi-k2-thinking.toml | 23 +++++++ .../llmgateway/models/moonshot/kimi-k2.toml | 23 +++++++ .../models/nvidia/nemotron-nano-9b-v2.toml | 21 ++++++ .../models/openai/gpt-3.5-turbo.toml | 21 ++++++ .../llmgateway/models/openai/gpt-4-turbo.toml | 21 ++++++ .../models/openai/gpt-4.1-mini.toml | 21 ++++++ .../models/openai/gpt-4.1-nano.toml | 21 ++++++ .../llmgateway/models/openai/gpt-4.1.toml | 21 ++++++ providers/llmgateway/models/openai/gpt-4.toml | 22 ++++++ .../openai/gpt-4o-mini-search-preview.toml | 22 ++++++ .../llmgateway/models/openai/gpt-4o-mini.toml | 23 +++++++ .../models/openai/gpt-4o-search-preview.toml | 22 ++++++ .../llmgateway/models/openai/gpt-4o.toml | 23 +++++++ .../models/openai/gpt-5-chat-latest.toml | 23 +++++++ .../llmgateway/models/openai/gpt-5-mini.toml | 23 +++++++ .../llmgateway/models/openai/gpt-5-nano.toml | 23 +++++++ .../llmgateway/models/openai/gpt-5-pro.toml | 22 ++++++ .../models/openai/gpt-5.1-codex-mini.toml | 23 +++++++ .../models/openai/gpt-5.1-codex.toml | 22 ++++++ .../llmgateway/models/openai/gpt-5.1.toml | 23 +++++++ .../models/openai/gpt-5.2-chat-latest.toml | 23 +++++++ .../llmgateway/models/openai/gpt-5.2-pro.toml | 22 ++++++ .../llmgateway/models/openai/gpt-5.2.toml | 23 +++++++ providers/llmgateway/models/openai/gpt-5.toml | 23 +++++++ .../models/openai/gpt-oss-120b.toml | 22 ++++++ .../models/openai/gpt-oss-20b-free.toml | 21 ++++++ .../llmgateway/models/openai/gpt-oss-20b.toml | 22 ++++++ .../llmgateway/models/openai/o1-mini.toml | 22 ++++++ providers/llmgateway/models/openai/o1.toml | 21 ++++++ .../llmgateway/models/openai/o3-mini.toml | 21 ++++++ 
providers/llmgateway/models/openai/o3.toml | 21 ++++++ .../models/perplexity/sonar-pro.toml | 21 ++++++ .../perplexity/sonar-reasoning-pro.toml | 21 ++++++ .../llmgateway/models/perplexity/sonar.toml | 21 ++++++ .../llmgateway/models/xai/grok-3-mini.toml | 21 ++++++ providers/llmgateway/models/xai/grok-3.toml | 21 ++++++ .../llmgateway/models/xai/grok-4-0709.toml | 22 ++++++ .../xai/grok-4-1-fast-non-reasoning.toml | 21 ++++++ .../models/xai/grok-4-1-fast-reasoning.toml | 21 ++++++ .../models/xai/grok-4-fast-non-reasoning.toml | 22 ++++++ .../models/xai/grok-4-fast-reasoning.toml | 22 ++++++ providers/llmgateway/models/xai/grok-4.toml | 22 ++++++ .../models/xai/grok-code-fast-1.toml | 22 ++++++ .../llmgateway/models/zai/cogview-4.toml | 22 ++++++ .../models/zai/glm-4-32b-0414-128k.toml | 21 ++++++ .../models/zai/glm-4.5-air-free.toml | 21 ++++++ .../llmgateway/models/zai/glm-4.5-air.toml | 22 ++++++ .../llmgateway/models/zai/glm-4.5-airx.toml | 22 ++++++ .../llmgateway/models/zai/glm-4.5-flash.toml | 21 ++++++ .../llmgateway/models/zai/glm-4.5-x.toml | 23 +++++++ providers/llmgateway/models/zai/glm-4.5.toml | 22 ++++++ providers/llmgateway/models/zai/glm-4.5v.toml | 23 +++++++ providers/llmgateway/models/zai/glm-4.6.toml | 22 ++++++ .../llmgateway/models/zai/glm-4.6v-flash.toml | 22 ++++++ .../models/zai/glm-4.6v-flashx.toml | 23 +++++++ providers/llmgateway/models/zai/glm-4.6v.toml | 23 +++++++ .../llmgateway/models/zai/glm-4.7-flash.toml | 22 ++++++ .../llmgateway/models/zai/glm-4.7-flashx.toml | 23 +++++++ providers/llmgateway/models/zai/glm-4.7.toml | 23 +++++++ .../llmgateway/models/zai/glm-image.toml | 22 ++++++ providers/llmgateway/provider.toml | 5 ++ providers/llmgateway/scripts/generate.ts | 11 +++ 157 files changed, 3453 insertions(+) create mode 100644 providers/llmgateway/README.md create mode 100644 providers/llmgateway/logo.svg create mode 100644 providers/llmgateway/models/alibaba/qwen-flash.toml create mode 100644 
providers/llmgateway/models/alibaba/qwen-image-max-2025-12-30.toml create mode 100644 providers/llmgateway/models/alibaba/qwen-image-max.toml create mode 100644 providers/llmgateway/models/alibaba/qwen-image-plus.toml create mode 100644 providers/llmgateway/models/alibaba/qwen-image.toml create mode 100644 providers/llmgateway/models/alibaba/qwen-max-latest.toml create mode 100644 providers/llmgateway/models/alibaba/qwen-max.toml create mode 100644 providers/llmgateway/models/alibaba/qwen-omni-turbo.toml create mode 100644 providers/llmgateway/models/alibaba/qwen-plus-latest.toml create mode 100644 providers/llmgateway/models/alibaba/qwen-plus.toml create mode 100644 providers/llmgateway/models/alibaba/qwen-turbo.toml create mode 100644 providers/llmgateway/models/alibaba/qwen-vl-max.toml create mode 100644 providers/llmgateway/models/alibaba/qwen-vl-plus.toml create mode 100644 providers/llmgateway/models/alibaba/qwen2-5-vl-72b-instruct.toml create mode 100644 providers/llmgateway/models/alibaba/qwen25-coder-7b.toml create mode 100644 providers/llmgateway/models/alibaba/qwen3-235b-a22b-instruct-2507.toml create mode 100644 providers/llmgateway/models/alibaba/qwen3-235b-a22b-thinking-2507.toml create mode 100644 providers/llmgateway/models/alibaba/qwen3-30b-a3b-instruct-2507.toml create mode 100644 providers/llmgateway/models/alibaba/qwen3-30b-a3b-thinking-2507.toml create mode 100644 providers/llmgateway/models/alibaba/qwen3-32b.toml create mode 100644 providers/llmgateway/models/alibaba/qwen3-coder-30b-a3b-instruct.toml create mode 100644 providers/llmgateway/models/alibaba/qwen3-coder-480b-a35b-instruct.toml create mode 100644 providers/llmgateway/models/alibaba/qwen3-coder-plus.toml create mode 100644 providers/llmgateway/models/alibaba/qwen3-coder.toml create mode 100644 providers/llmgateway/models/alibaba/qwen3-max.toml create mode 100644 providers/llmgateway/models/alibaba/qwen3-next-80b-a3b-instruct.toml create mode 100644 
providers/llmgateway/models/alibaba/qwen3-next-80b-a3b-thinking.toml create mode 100644 providers/llmgateway/models/anthropic/claude-3-5-haiku-20241022.toml create mode 100644 providers/llmgateway/models/anthropic/claude-3-5-haiku.toml create mode 100644 providers/llmgateway/models/anthropic/claude-3-5-sonnet-20240620.toml create mode 100644 providers/llmgateway/models/anthropic/claude-3-5-sonnet.toml create mode 100644 providers/llmgateway/models/anthropic/claude-3-7-sonnet-20250219.toml create mode 100644 providers/llmgateway/models/anthropic/claude-3-7-sonnet.toml create mode 100644 providers/llmgateway/models/anthropic/claude-3-haiku.toml create mode 100644 providers/llmgateway/models/anthropic/claude-3-opus.toml create mode 100644 providers/llmgateway/models/anthropic/claude-haiku-4-5-20251001.toml create mode 100644 providers/llmgateway/models/anthropic/claude-haiku-4-5.toml create mode 100644 providers/llmgateway/models/anthropic/claude-opus-4-1-20250805.toml create mode 100644 providers/llmgateway/models/anthropic/claude-opus-4-20250514.toml create mode 100644 providers/llmgateway/models/anthropic/claude-opus-4-5-20251101.toml create mode 100644 providers/llmgateway/models/anthropic/claude-sonnet-4-20250514.toml create mode 100644 providers/llmgateway/models/anthropic/claude-sonnet-4-5-20250929.toml create mode 100644 providers/llmgateway/models/anthropic/claude-sonnet-4-5.toml create mode 100644 providers/llmgateway/models/bytedance/seed-1-6-250615.toml create mode 100644 providers/llmgateway/models/bytedance/seed-1-6-250915.toml create mode 100644 providers/llmgateway/models/bytedance/seed-1-6-flash-250715.toml create mode 100644 providers/llmgateway/models/bytedance/seed-1-8-251228.toml create mode 100644 providers/llmgateway/models/bytedance/seedream-4-0.toml create mode 100644 providers/llmgateway/models/bytedance/seedream-4-5.toml create mode 100644 providers/llmgateway/models/deepseek/deepseek-r1-0528.toml create mode 100644 
providers/llmgateway/models/deepseek/deepseek-r1t2-chimera-free.toml create mode 100644 providers/llmgateway/models/deepseek/deepseek-v3.1.toml create mode 100644 providers/llmgateway/models/deepseek/deepseek-v3.2.toml create mode 100644 providers/llmgateway/models/deepseek/deepseek-v3.toml create mode 100644 providers/llmgateway/models/google/gemini-2.0-flash-lite.toml create mode 100644 providers/llmgateway/models/google/gemini-2.0-flash.toml create mode 100644 providers/llmgateway/models/google/gemini-2.5-flash-image-preview.toml create mode 100644 providers/llmgateway/models/google/gemini-2.5-flash-image.toml create mode 100644 providers/llmgateway/models/google/gemini-2.5-flash-lite-preview-09-2025.toml create mode 100644 providers/llmgateway/models/google/gemini-2.5-flash-lite.toml create mode 100644 providers/llmgateway/models/google/gemini-2.5-flash-preview-09-2025.toml create mode 100644 providers/llmgateway/models/google/gemini-2.5-flash.toml create mode 100644 providers/llmgateway/models/google/gemini-2.5-pro.toml create mode 100644 providers/llmgateway/models/google/gemini-3-flash-preview.toml create mode 100644 providers/llmgateway/models/google/gemini-3-pro-image-preview.toml create mode 100644 providers/llmgateway/models/google/gemini-3-pro-preview.toml create mode 100644 providers/llmgateway/models/google/gemma-2-27b-it-together.toml create mode 100644 providers/llmgateway/models/google/gemma-3-12b-it.toml create mode 100644 providers/llmgateway/models/google/gemma-3-1b-it.toml create mode 100644 providers/llmgateway/models/google/gemma-3-27b.toml create mode 100644 providers/llmgateway/models/google/gemma-3-4b-it.toml create mode 100644 providers/llmgateway/models/google/gemma-3n-e2b-it.toml create mode 100644 providers/llmgateway/models/google/gemma-3n-e4b-it.toml create mode 100644 providers/llmgateway/models/llmgateway/auto.toml create mode 100644 providers/llmgateway/models/llmgateway/custom.toml create mode 100644 
providers/llmgateway/models/meta/llama-3.1-70b-instruct.toml create mode 100644 providers/llmgateway/models/meta/llama-3.1-8b-instruct.toml create mode 100644 providers/llmgateway/models/meta/llama-3.1-nemotron-ultra-253b.toml create mode 100644 providers/llmgateway/models/meta/llama-3.2-11b-instruct.toml create mode 100644 providers/llmgateway/models/meta/llama-3.3-70b-instruct-free.toml create mode 100644 providers/llmgateway/models/meta/llama-3.3-70b-instruct.toml create mode 100644 providers/llmgateway/models/meta/llama-4-maverick-17b-instruct.toml create mode 100644 providers/llmgateway/models/meta/llama-4-maverick-free.toml create mode 100644 providers/llmgateway/models/meta/llama-4-scout-17b-instruct.toml create mode 100644 providers/llmgateway/models/meta/llama-4-scout-free.toml create mode 100644 providers/llmgateway/models/meta/llama-4-scout.toml create mode 100644 providers/llmgateway/models/meta/llama-guard-4-12b.toml create mode 100644 providers/llmgateway/models/minimax/minimax-m2.1.toml create mode 100644 providers/llmgateway/models/mistral/mistral-large-latest.toml create mode 100644 providers/llmgateway/models/mistral/mixtral-8x7b-instruct-together.toml create mode 100644 providers/llmgateway/models/mistral/pixtral-large-latest.toml create mode 100644 providers/llmgateway/models/moonshot/kimi-k2-0905-free.toml create mode 100644 providers/llmgateway/models/moonshot/kimi-k2-thinking-turbo.toml create mode 100644 providers/llmgateway/models/moonshot/kimi-k2-thinking.toml create mode 100644 providers/llmgateway/models/moonshot/kimi-k2.toml create mode 100644 providers/llmgateway/models/nvidia/nemotron-nano-9b-v2.toml create mode 100644 providers/llmgateway/models/openai/gpt-3.5-turbo.toml create mode 100644 providers/llmgateway/models/openai/gpt-4-turbo.toml create mode 100644 providers/llmgateway/models/openai/gpt-4.1-mini.toml create mode 100644 providers/llmgateway/models/openai/gpt-4.1-nano.toml create mode 100644 
providers/llmgateway/models/openai/gpt-4.1.toml create mode 100644 providers/llmgateway/models/openai/gpt-4.toml create mode 100644 providers/llmgateway/models/openai/gpt-4o-mini-search-preview.toml create mode 100644 providers/llmgateway/models/openai/gpt-4o-mini.toml create mode 100644 providers/llmgateway/models/openai/gpt-4o-search-preview.toml create mode 100644 providers/llmgateway/models/openai/gpt-4o.toml create mode 100644 providers/llmgateway/models/openai/gpt-5-chat-latest.toml create mode 100644 providers/llmgateway/models/openai/gpt-5-mini.toml create mode 100644 providers/llmgateway/models/openai/gpt-5-nano.toml create mode 100644 providers/llmgateway/models/openai/gpt-5-pro.toml create mode 100644 providers/llmgateway/models/openai/gpt-5.1-codex-mini.toml create mode 100644 providers/llmgateway/models/openai/gpt-5.1-codex.toml create mode 100644 providers/llmgateway/models/openai/gpt-5.1.toml create mode 100644 providers/llmgateway/models/openai/gpt-5.2-chat-latest.toml create mode 100644 providers/llmgateway/models/openai/gpt-5.2-pro.toml create mode 100644 providers/llmgateway/models/openai/gpt-5.2.toml create mode 100644 providers/llmgateway/models/openai/gpt-5.toml create mode 100644 providers/llmgateway/models/openai/gpt-oss-120b.toml create mode 100644 providers/llmgateway/models/openai/gpt-oss-20b-free.toml create mode 100644 providers/llmgateway/models/openai/gpt-oss-20b.toml create mode 100644 providers/llmgateway/models/openai/o1-mini.toml create mode 100644 providers/llmgateway/models/openai/o1.toml create mode 100644 providers/llmgateway/models/openai/o3-mini.toml create mode 100644 providers/llmgateway/models/openai/o3.toml create mode 100644 providers/llmgateway/models/perplexity/sonar-pro.toml create mode 100644 providers/llmgateway/models/perplexity/sonar-reasoning-pro.toml create mode 100644 providers/llmgateway/models/perplexity/sonar.toml create mode 100644 providers/llmgateway/models/xai/grok-3-mini.toml create mode 100644 
providers/llmgateway/models/xai/grok-3.toml create mode 100644 providers/llmgateway/models/xai/grok-4-0709.toml create mode 100644 providers/llmgateway/models/xai/grok-4-1-fast-non-reasoning.toml create mode 100644 providers/llmgateway/models/xai/grok-4-1-fast-reasoning.toml create mode 100644 providers/llmgateway/models/xai/grok-4-fast-non-reasoning.toml create mode 100644 providers/llmgateway/models/xai/grok-4-fast-reasoning.toml create mode 100644 providers/llmgateway/models/xai/grok-4.toml create mode 100644 providers/llmgateway/models/xai/grok-code-fast-1.toml create mode 100644 providers/llmgateway/models/zai/cogview-4.toml create mode 100644 providers/llmgateway/models/zai/glm-4-32b-0414-128k.toml create mode 100644 providers/llmgateway/models/zai/glm-4.5-air-free.toml create mode 100644 providers/llmgateway/models/zai/glm-4.5-air.toml create mode 100644 providers/llmgateway/models/zai/glm-4.5-airx.toml create mode 100644 providers/llmgateway/models/zai/glm-4.5-flash.toml create mode 100644 providers/llmgateway/models/zai/glm-4.5-x.toml create mode 100644 providers/llmgateway/models/zai/glm-4.5.toml create mode 100644 providers/llmgateway/models/zai/glm-4.5v.toml create mode 100644 providers/llmgateway/models/zai/glm-4.6.toml create mode 100644 providers/llmgateway/models/zai/glm-4.6v-flash.toml create mode 100644 providers/llmgateway/models/zai/glm-4.6v-flashx.toml create mode 100644 providers/llmgateway/models/zai/glm-4.6v.toml create mode 100644 providers/llmgateway/models/zai/glm-4.7-flash.toml create mode 100644 providers/llmgateway/models/zai/glm-4.7-flashx.toml create mode 100644 providers/llmgateway/models/zai/glm-4.7.toml create mode 100644 providers/llmgateway/models/zai/glm-image.toml create mode 100644 providers/llmgateway/provider.toml create mode 100644 providers/llmgateway/scripts/generate.ts diff --git a/providers/llmgateway/README.md b/providers/llmgateway/README.md new file mode 100644 index 000000000..8292fff56 --- /dev/null +++ 
b/providers/llmgateway/README.md @@ -0,0 +1,68 @@ +# LLM Gateway Provider + +This provider enables access to 150+ AI models through [LLM Gateway](https://llmgateway.io), an OpenAI-compatible API gateway that provides unified access to 40+ LLM providers. + +## Directory Structure + +- **models/**: TOML configuration files organized by upstream provider + - **anthropic/**: Claude models + - **openai/**: GPT and o-series models + - **google/**: Gemini and Gemma models + - **meta/**: Llama models + - **xai/**: Grok models + - **deepseek/**: DeepSeek models + - **alibaba/**: Qwen models + - **mistral/**: Mistral and Mixtral models + - **zai/**: GLM models + - **llmgateway/**: LLM Gateway native models (auto-routing and custom) + - And more... +- **scripts/**: Scripts for generating model configurations +- **provider.toml**: Provider configuration + +## How It Works + +LLM Gateway acts as a unified proxy for multiple AI providers. You can access any supported model through a single API endpoint using your LLM Gateway API key. + +## Prerequisites + +```bash +export LLMGATEWAY_API_KEY="your-api-key" +``` + +## Supported Providers + +- OpenAI (GPT-3.5, GPT-4, GPT-4o, GPT-5, o1, o3, o4-mini) +- Anthropic (Claude 3, 3.5, 3.7, 4, 4.1, 4.5) +- Google (Gemini 1.5, 2.0, 2.5, 3, Gemma) +- Meta (Llama 3.1, 3.2, 3.3, 4) +- xAI (Grok 2, 3, 4) +- DeepSeek (V3, R1) +- Alibaba (Qwen Max, Plus, Flash, VL, Coder) +- Mistral (Large, Pixtral, Mixtral) +- ZAI (GLM 4.5, 4.6, 4.7) +- ByteDance (Seed, Seedream) +- Moonshot (Kimi K2) +- Perplexity (Sonar) +- And many more... 
+ +## Usage with AI SDK + +```typescript +import { createOpenAICompatible } from "@ai-sdk/openai-compatible"; +import { generateText } from "ai"; +const llmgateway = createOpenAICompatible({ + baseURL: "https://api.llmgateway.io/v1", + apiKey: process.env.LLMGATEWAY_API_KEY, +}); + +const result = await generateText({ + model: llmgateway("claude-sonnet-4-5"), + prompt: "Hello!", +}); +``` + +## Links + +- [Documentation](https://llmgateway.io/docs) +- [Pricing](https://llmgateway.io/pricing) +- [GitHub](https://github.com/theopenco/llmgateway) diff --git a/providers/llmgateway/logo.svg b/providers/llmgateway/logo.svg new file mode 100644 index 000000000..77135ce4f --- /dev/null +++ b/providers/llmgateway/logo.svg @@ -0,0 +1,4 @@ + + + + diff --git a/providers/llmgateway/models/alibaba/qwen-flash.toml b/providers/llmgateway/models/alibaba/qwen-flash.toml new file mode 100644 index 000000000..e09911f57 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen-flash.toml @@ -0,0 +1,22 @@ +name = "Qwen Flash" +family = "qwen" +release_date = "2024-09-09" +last_updated = "2024-09-09" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.05 +output = 0.40 + +[limit] +context = 1_000_000 +output = 32_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen-image-max-2025-12-30.toml b/providers/llmgateway/models/alibaba/qwen-image-max-2025-12-30.toml new file mode 100644 index 000000000..83b4c97f9 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen-image-max-2025-12-30.toml @@ -0,0 +1,22 @@ +name = "Qwen Image Max 2025-12-30" +family = "qwen" +release_date = "2025-12-31" +last_updated = "2025-12-31" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 2_000 +output = 4_096 + +[modalities] 
+input = ["text"] +output = ["text", "image"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen-image-max.toml b/providers/llmgateway/models/alibaba/qwen-image-max.toml new file mode 100644 index 000000000..c7d114a03 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen-image-max.toml @@ -0,0 +1,22 @@ +name = "Qwen Image Max" +family = "qwen" +release_date = "2025-08-04" +last_updated = "2025-08-04" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 2_000 +output = 4_096 + +[modalities] +input = ["text"] +output = ["text", "image"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen-image-plus.toml b/providers/llmgateway/models/alibaba/qwen-image-plus.toml new file mode 100644 index 000000000..c0078bcc3 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen-image-plus.toml @@ -0,0 +1,22 @@ +name = "Qwen Image Plus" +family = "qwen" +release_date = "2025-08-04" +last_updated = "2025-08-04" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 2_000 +output = 4_096 + +[modalities] +input = ["text"] +output = ["text", "image"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen-image.toml b/providers/llmgateway/models/alibaba/qwen-image.toml new file mode 100644 index 000000000..2024a02a8 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen-image.toml @@ -0,0 +1,22 @@ +name = "Qwen Image" +family = "qwen" +release_date = "2025-08-04" +last_updated = "2025-08-04" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 2_000 +output = 4_096 + +[modalities] +input = 
["text"] +output = ["text", "image"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen-max-latest.toml b/providers/llmgateway/models/alibaba/qwen-max-latest.toml new file mode 100644 index 000000000..c65a8894c --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen-max-latest.toml @@ -0,0 +1,22 @@ +name = "Qwen Max Latest" +family = "qwen" +release_date = "2025-01-25" +last_updated = "2025-01-25" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 1.60 +output = 6.40 + +[limit] +context = 131_072 +output = 32_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen-max.toml b/providers/llmgateway/models/alibaba/qwen-max.toml new file mode 100644 index 000000000..3207ded01 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen-max.toml @@ -0,0 +1,22 @@ +name = "Qwen Max" +family = "qwen" +release_date = "2025-09-05" +last_updated = "2025-09-05" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 1.60 +output = 6.40 + +[limit] +context = 131_072 +output = 32_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen-omni-turbo.toml b/providers/llmgateway/models/alibaba/qwen-omni-turbo.toml new file mode 100644 index 000000000..d871d81aa --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen-omni-turbo.toml @@ -0,0 +1,22 @@ +name = "Qwen Omni Turbo" +family = "qwen" +release_date = "2025-03-26" +last_updated = "2025-03-26" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.20 +output = 0.80 + +[limit] +context = 32_768 +output = 8_192 + +[modalities] +input = ["text", 
"image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen-plus-latest.toml b/providers/llmgateway/models/alibaba/qwen-plus-latest.toml new file mode 100644 index 000000000..5da8f1be9 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen-plus-latest.toml @@ -0,0 +1,22 @@ +name = "Qwen Plus Latest" +family = "qwen" +release_date = "2024-09-09" +last_updated = "2024-09-09" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.40 +output = 1.20 + +[limit] +context = 1_000_000 +output = 32_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen-plus.toml b/providers/llmgateway/models/alibaba/qwen-plus.toml new file mode 100644 index 000000000..a41679ac6 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen-plus.toml @@ -0,0 +1,22 @@ +name = "Qwen Plus" +family = "qwen" +release_date = "2025-01-25" +last_updated = "2025-01-25" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.40 +output = 1.20 + +[limit] +context = 131_072 +output = 32_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen-turbo.toml b/providers/llmgateway/models/alibaba/qwen-turbo.toml new file mode 100644 index 000000000..975c2315b --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen-turbo.toml @@ -0,0 +1,22 @@ +name = "Qwen Turbo" +family = "qwen" +release_date = "2025-02-01" +last_updated = "2025-02-01" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.05 +output = 0.20 + +[limit] +context = 1_000_000 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at 
end of file diff --git a/providers/llmgateway/models/alibaba/qwen-vl-max.toml b/providers/llmgateway/models/alibaba/qwen-vl-max.toml new file mode 100644 index 000000000..53a7cdef3 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen-vl-max.toml @@ -0,0 +1,22 @@ +name = "Qwen VL Max" +family = "qwen" +release_date = "2025-02-01" +last_updated = "2025-02-01" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.80 +output = 3.20 + +[limit] +context = 131_072 +output = 32_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen-vl-plus.toml b/providers/llmgateway/models/alibaba/qwen-vl-plus.toml new file mode 100644 index 000000000..ea6262368 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen-vl-plus.toml @@ -0,0 +1,22 @@ +name = "Qwen VL Plus" +family = "qwen" +release_date = "2025-02-05" +last_updated = "2025-02-05" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.21 +output = 0.64 + +[limit] +context = 131_072 +output = 32_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen2-5-vl-72b-instruct.toml b/providers/llmgateway/models/alibaba/qwen2-5-vl-72b-instruct.toml new file mode 100644 index 000000000..950838ae5 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen2-5-vl-72b-instruct.toml @@ -0,0 +1,22 @@ +name = "Qwen2.5 VL 72B Instruct" +family = "qwen" +release_date = "2025-01-26" +last_updated = "2025-01-26" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.13 +output = 0.40 + +[limit] +context = 32_768 +output = 8_192 + +[modalities] +input = ["text", "image"] +output = 
["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen25-coder-7b.toml b/providers/llmgateway/models/alibaba/qwen25-coder-7b.toml new file mode 100644 index 000000000..d297f6571 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen25-coder-7b.toml @@ -0,0 +1,22 @@ +name = "Qwen2.5 Coder 7B" +family = "qwen" +release_date = "2024-09-19" +last_updated = "2024-09-19" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.01 +output = 0.03 + +[limit] +context = 32_768 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen3-235b-a22b-instruct-2507.toml b/providers/llmgateway/models/alibaba/qwen3-235b-a22b-instruct-2507.toml new file mode 100644 index 000000000..4386b79bf --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen3-235b-a22b-instruct-2507.toml @@ -0,0 +1,23 @@ +name = "Qwen3 235B A22B Instruct 2507" +family = "qwen" +release_date = "2025-07-21" +last_updated = "2025-07-21" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true +status = "beta" + +[cost] +input = 0.20 +output = 0.60 + +[limit] +context = 262_000 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen3-235b-a22b-thinking-2507.toml b/providers/llmgateway/models/alibaba/qwen3-235b-a22b-thinking-2507.toml new file mode 100644 index 000000000..fbce668d1 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen3-235b-a22b-thinking-2507.toml @@ -0,0 +1,23 @@ +name = "Qwen3 235B A22B Thinking 2507" +family = "qwen" +release_date = "2025-07-25" +last_updated = "2025-07-25" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = true +status = 
"beta" + +[cost] +input = 0.20 +output = 0.60 + +[limit] +context = 262_000 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen3-30b-a3b-instruct-2507.toml b/providers/llmgateway/models/alibaba/qwen3-30b-a3b-instruct-2507.toml new file mode 100644 index 000000000..82d13f7b0 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen3-30b-a3b-instruct-2507.toml @@ -0,0 +1,22 @@ +name = "Qwen3 30B A3B Instruct 2507" +family = "qwen" +release_date = "2025-07-30" +last_updated = "2025-07-30" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.10 +output = 0.30 + +[limit] +context = 262_000 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen3-30b-a3b-thinking-2507.toml b/providers/llmgateway/models/alibaba/qwen3-30b-a3b-thinking-2507.toml new file mode 100644 index 000000000..4589eb5ce --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen3-30b-a3b-thinking-2507.toml @@ -0,0 +1,22 @@ +name = "Qwen3 30B A3B Thinking 2507" +family = "qwen" +release_date = "2025-07-30" +last_updated = "2025-07-30" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.10 +output = 0.30 + +[limit] +context = 262_000 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen3-32b.toml b/providers/llmgateway/models/alibaba/qwen3-32b.toml new file mode 100644 index 000000000..a19495067 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen3-32b.toml @@ -0,0 +1,22 @@ +name = "Qwen3 32B" +family = "qwen" +release_date = "2025-04-28" +last_updated = "2025-04-28" +attachment = false +reasoning = false +temperature = true 
+tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.10 +output = 0.30 + +[limit] +context = 32_768 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen3-coder-30b-a3b-instruct.toml b/providers/llmgateway/models/alibaba/qwen3-coder-30b-a3b-instruct.toml new file mode 100644 index 000000000..d6110d145 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen3-coder-30b-a3b-instruct.toml @@ -0,0 +1,22 @@ +name = "Qwen3 Coder 30B A3B Instruct" +family = "qwen" +release_date = "2025-07-31" +last_updated = "2025-07-31" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.10 +output = 0.30 + +[limit] +context = 262_000 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen3-coder-480b-a35b-instruct.toml b/providers/llmgateway/models/alibaba/qwen3-coder-480b-a35b-instruct.toml new file mode 100644 index 000000000..698cd1a1b --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen3-coder-480b-a35b-instruct.toml @@ -0,0 +1,22 @@ +name = "Qwen3 Coder 480B A35B Instruct" +family = "qwen" +release_date = "2025-01-31" +last_updated = "2025-01-31" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.40 +output = 1.80 + +[limit] +context = 262_000 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen3-coder-plus.toml b/providers/llmgateway/models/alibaba/qwen3-coder-plus.toml new file mode 100644 index 000000000..6817f6e73 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen3-coder-plus.toml @@ -0,0 +1,22 @@ +name = "Qwen3 Coder Plus" +family = "qwen" +release_date = 
"2025-09-23" +last_updated = "2025-09-23" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 6.00 +output = 60.00 + +[limit] +context = 1_000_000 +output = 66_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen3-coder.toml b/providers/llmgateway/models/alibaba/qwen3-coder.toml new file mode 100644 index 000000000..ff536a2fc --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen3-coder.toml @@ -0,0 +1,22 @@ +name = "Qwen3 Coder" +family = "qwen" +release_date = "2025-07-23" +last_updated = "2025-07-23" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.22 +output = 0.95 + +[limit] +context = 262_000 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen3-max.toml b/providers/llmgateway/models/alibaba/qwen3-max.toml new file mode 100644 index 000000000..da79ecf8f --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen3-max.toml @@ -0,0 +1,23 @@ +name = "Qwen3 Max" +family = "qwen" +release_date = "2025-09-24" +last_updated = "2025-09-24" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 3.00 +output = 15.00 +cache_read = 0.60 + +[limit] +context = 256_000 +output = 32_800 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen3-next-80b-a3b-instruct.toml b/providers/llmgateway/models/alibaba/qwen3-next-80b-a3b-instruct.toml new file mode 100644 index 000000000..8827c2e00 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen3-next-80b-a3b-instruct.toml @@ -0,0 +1,22 @@ +name = "Qwen3 Next 80B A3B Instruct" 
+family = "qwen" +release_date = "2025-09-10" +last_updated = "2025-09-10" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.50 +output = 2.00 + +[limit] +context = 129_024 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/alibaba/qwen3-next-80b-a3b-thinking.toml b/providers/llmgateway/models/alibaba/qwen3-next-80b-a3b-thinking.toml new file mode 100644 index 000000000..ca4b46a01 --- /dev/null +++ b/providers/llmgateway/models/alibaba/qwen3-next-80b-a3b-thinking.toml @@ -0,0 +1,23 @@ +name = "Qwen3 Next 80B A3B Thinking" +family = "qwen" +release_date = "2025-09-10" +last_updated = "2025-09-10" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = false +open_weights = true +status = "beta" + +[cost] +input = 0.50 +output = 6.00 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/anthropic/claude-3-5-haiku-20241022.toml b/providers/llmgateway/models/anthropic/claude-3-5-haiku-20241022.toml new file mode 100644 index 000000000..f36e5c2f8 --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-3-5-haiku-20241022.toml @@ -0,0 +1,24 @@ +name = "Claude 3.5 Haiku (2024-10-22)" +family = "claude" +release_date = "2024-10-22" +last_updated = "2024-10-22" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = false +open_weights = false +status = "deprecated" + +[cost] +input = 0.80 +output = 4.00 +cache_read = 0.08 + +[limit] +context = 200_000 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/anthropic/claude-3-5-haiku.toml b/providers/llmgateway/models/anthropic/claude-3-5-haiku.toml new file 
mode 100644 index 000000000..cbe510f64 --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-3-5-haiku.toml @@ -0,0 +1,23 @@ +name = "Claude 3.5 Haiku" +family = "claude" +release_date = "2024-10-22" +last_updated = "2024-10-22" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = false +open_weights = false + +[cost] +input = 0.80 +output = 4.00 +cache_read = 0.08 + +[limit] +context = 200_000 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/anthropic/claude-3-5-sonnet-20240620.toml b/providers/llmgateway/models/anthropic/claude-3-5-sonnet-20240620.toml new file mode 100644 index 000000000..70e49ed5f --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-3-5-sonnet-20240620.toml @@ -0,0 +1,23 @@ +name = "Claude 3.5 Sonnet (Old)" +family = "claude" +release_date = "2024-06-20" +last_updated = "2024-06-20" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = false +open_weights = false + +[cost] +input = 3.00 +output = 15.00 +cache_read = 0.30 + +[limit] +context = 200_000 +output = 8_192 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/anthropic/claude-3-5-sonnet.toml b/providers/llmgateway/models/anthropic/claude-3-5-sonnet.toml new file mode 100644 index 000000000..0990095d4 --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-3-5-sonnet.toml @@ -0,0 +1,22 @@ +name = "Claude 3.5 Sonnet" +family = "claude" +release_date = "2024-06-20" +last_updated = "2024-06-20" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = false +open_weights = false + +[cost] +input = 3.00 +output = 15.00 +cache_read = 0.30 + +[limit] +context = 200_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git 
a/providers/llmgateway/models/anthropic/claude-3-7-sonnet-20250219.toml b/providers/llmgateway/models/anthropic/claude-3-7-sonnet-20250219.toml new file mode 100644 index 000000000..1572e751b --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-3-7-sonnet-20250219.toml @@ -0,0 +1,23 @@ +name = "Claude 3.7 Sonnet (2025-02-19)" +family = "claude" +release_date = "2025-02-19" +last_updated = "2025-02-19" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = false +open_weights = false + +[cost] +input = 3.00 +output = 15.00 +cache_read = 0.30 + +[limit] +context = 200_000 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/anthropic/claude-3-7-sonnet.toml b/providers/llmgateway/models/anthropic/claude-3-7-sonnet.toml new file mode 100644 index 000000000..3800cc12f --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-3-7-sonnet.toml @@ -0,0 +1,23 @@ +name = "Claude 3.7 Sonnet" +family = "claude" +release_date = "2025-02-24" +last_updated = "2025-02-24" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = false +open_weights = false + +[cost] +input = 3.00 +output = 15.00 +cache_read = 0.30 + +[limit] +context = 200_000 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/anthropic/claude-3-haiku.toml b/providers/llmgateway/models/anthropic/claude-3-haiku.toml new file mode 100644 index 000000000..67494e981 --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-3-haiku.toml @@ -0,0 +1,23 @@ +name = "Claude 3 Haiku" +family = "claude" +release_date = "2024-03-04" +last_updated = "2024-03-04" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = false +open_weights = false + +[cost] +input = 0.25 +output = 1.25 +cache_read = 0.03 + +[limit] 
+context = 200_000 +output = 4_096 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/anthropic/claude-3-opus.toml b/providers/llmgateway/models/anthropic/claude-3-opus.toml new file mode 100644 index 000000000..8cf509623 --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-3-opus.toml @@ -0,0 +1,23 @@ +name = "Claude 3 Opus" +family = "claude" +release_date = "2024-03-04" +last_updated = "2024-03-04" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = false +open_weights = false + +[cost] +input = 15.00 +output = 75.00 +cache_read = 1.50 + +[limit] +context = 200_000 +output = 4_096 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/anthropic/claude-haiku-4-5-20251001.toml b/providers/llmgateway/models/anthropic/claude-haiku-4-5-20251001.toml new file mode 100644 index 000000000..8b1cf8cb2 --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-haiku-4-5-20251001.toml @@ -0,0 +1,23 @@ +name = "Claude Haiku 4.5 (2025-10-01)" +family = "claude" +release_date = "2025-10-15" +last_updated = "2025-10-15" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 1.00 +output = 5.00 +cache_read = 0.10 + +[limit] +context = 200_000 +output = 64_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/anthropic/claude-haiku-4-5.toml b/providers/llmgateway/models/anthropic/claude-haiku-4-5.toml new file mode 100644 index 000000000..61c4fb842 --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-haiku-4-5.toml @@ -0,0 +1,23 @@ +name = "Claude Haiku 4.5" +family = "claude" +release_date = "2025-10-15" +last_updated = "2025-10-15" +attachment = false +reasoning = false +temperature = true 
+tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 1.00 +output = 5.00 +cache_read = 0.10 + +[limit] +context = 200_000 +output = 64_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/anthropic/claude-opus-4-1-20250805.toml b/providers/llmgateway/models/anthropic/claude-opus-4-1-20250805.toml new file mode 100644 index 000000000..12f7d8575 --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-opus-4-1-20250805.toml @@ -0,0 +1,23 @@ +name = "Claude Opus 4.1" +family = "claude" +release_date = "2025-08-05" +last_updated = "2025-08-05" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 15.00 +output = 75.00 +cache_read = 1.50 + +[limit] +context = 200_000 +output = 32_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/anthropic/claude-opus-4-20250514.toml b/providers/llmgateway/models/anthropic/claude-opus-4-20250514.toml new file mode 100644 index 000000000..5198af3bb --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-opus-4-20250514.toml @@ -0,0 +1,22 @@ +name = "Claude Opus 4 (2025-05-14)" +family = "claude" +release_date = "2025-05-22" +last_updated = "2025-05-22" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = false +open_weights = false + +[cost] +input = 15.00 +output = 75.00 +cache_read = 1.50 + +[limit] +context = 200_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/anthropic/claude-opus-4-5-20251101.toml b/providers/llmgateway/models/anthropic/claude-opus-4-5-20251101.toml new file mode 100644 index 000000000..5f6f67cc1 --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-opus-4-5-20251101.toml @@ -0,0 +1,23 @@ +name = 
"Claude Opus 4.5" +family = "claude" +release_date = "2025-11-24" +last_updated = "2025-11-24" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 5.00 +output = 25.00 +cache_read = 0.50 + +[limit] +context = 200_000 +output = 32_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/anthropic/claude-sonnet-4-20250514.toml b/providers/llmgateway/models/anthropic/claude-sonnet-4-20250514.toml new file mode 100644 index 000000000..f2b6be2ee --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-sonnet-4-20250514.toml @@ -0,0 +1,22 @@ +name = "Claude Sonnet 4 (2025-05-14)" +family = "claude" +release_date = "2025-05-14" +last_updated = "2025-05-14" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = false +open_weights = false + +[cost] +input = 3.00 +output = 15.00 +cache_read = 0.30 + +[limit] +context = 200_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/anthropic/claude-sonnet-4-5-20250929.toml b/providers/llmgateway/models/anthropic/claude-sonnet-4-5-20250929.toml new file mode 100644 index 000000000..e638be33a --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-sonnet-4-5-20250929.toml @@ -0,0 +1,23 @@ +name = "Claude Sonnet 4.5 (2025-09-29)" +family = "claude" +release_date = "2025-09-29" +last_updated = "2025-09-29" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 3.00 +output = 15.00 +cache_read = 0.30 + +[limit] +context = 200_000 +output = 64_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/anthropic/claude-sonnet-4-5.toml 
b/providers/llmgateway/models/anthropic/claude-sonnet-4-5.toml new file mode 100644 index 000000000..41e19c16b --- /dev/null +++ b/providers/llmgateway/models/anthropic/claude-sonnet-4-5.toml @@ -0,0 +1,23 @@ +name = "Claude Sonnet 4.5" +family = "claude" +release_date = "2025-09-29" +last_updated = "2025-09-29" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 3.00 +output = 15.00 +cache_read = 0.30 + +[limit] +context = 200_000 +output = 64_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/bytedance/seed-1-6-250615.toml b/providers/llmgateway/models/bytedance/seed-1-6-250615.toml new file mode 100644 index 000000000..5683b7a99 --- /dev/null +++ b/providers/llmgateway/models/bytedance/seed-1-6-250615.toml @@ -0,0 +1,22 @@ +name = "Seed 1.6 (250615)" +family = "bytedance" +release_date = "2025-06-25" +last_updated = "2025-06-25" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.25 +output = 2.00 +cache_read = 0.05 + +[limit] +context = 256_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/bytedance/seed-1-6-250915.toml b/providers/llmgateway/models/bytedance/seed-1-6-250915.toml new file mode 100644 index 000000000..bb37198a3 --- /dev/null +++ b/providers/llmgateway/models/bytedance/seed-1-6-250915.toml @@ -0,0 +1,22 @@ +name = "Seed 1.6 (250915)" +family = "bytedance" +release_date = "2025-09-15" +last_updated = "2025-09-15" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.25 +output = 2.00 +cache_read = 0.05 + +[limit] +context = 256_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file 
diff --git a/providers/llmgateway/models/bytedance/seed-1-6-flash-250715.toml b/providers/llmgateway/models/bytedance/seed-1-6-flash-250715.toml new file mode 100644 index 000000000..4d152a0f8 --- /dev/null +++ b/providers/llmgateway/models/bytedance/seed-1-6-flash-250715.toml @@ -0,0 +1,22 @@ +name = "Seed 1.6 Flash (250715)" +family = "bytedance" +release_date = "2025-07-26" +last_updated = "2025-07-26" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.07 +output = 0.30 +cache_read = 0.02 + +[limit] +context = 256_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/bytedance/seed-1-8-251228.toml b/providers/llmgateway/models/bytedance/seed-1-8-251228.toml new file mode 100644 index 000000000..8f6998609 --- /dev/null +++ b/providers/llmgateway/models/bytedance/seed-1-8-251228.toml @@ -0,0 +1,22 @@ +name = "Seed 1.8 (251228)" +family = "bytedance" +release_date = "2025-12-18" +last_updated = "2025-12-18" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.25 +output = 2.00 +cache_read = 0.05 + +[limit] +context = 256_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/bytedance/seedream-4-0.toml b/providers/llmgateway/models/bytedance/seedream-4-0.toml new file mode 100644 index 000000000..54b70ed17 --- /dev/null +++ b/providers/llmgateway/models/bytedance/seedream-4-0.toml @@ -0,0 +1,22 @@ +name = "Seedream 4.0" +family = "bytedance" +release_date = "2025-09-16" +last_updated = "2025-09-16" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = false + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 2_000 +output = 4_096 + +[modalities] +input 
= ["text"] +output = ["text", "image"] \ No newline at end of file diff --git a/providers/llmgateway/models/bytedance/seedream-4-5.toml b/providers/llmgateway/models/bytedance/seedream-4-5.toml new file mode 100644 index 000000000..1046c0e67 --- /dev/null +++ b/providers/llmgateway/models/bytedance/seedream-4-5.toml @@ -0,0 +1,22 @@ +name = "Seedream 4.5" +family = "bytedance" +release_date = "2025-12-03" +last_updated = "2025-12-03" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = false + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 2_000 +output = 4_096 + +[modalities] +input = ["text"] +output = ["text", "image"] \ No newline at end of file diff --git a/providers/llmgateway/models/deepseek/deepseek-r1-0528.toml b/providers/llmgateway/models/deepseek/deepseek-r1-0528.toml new file mode 100644 index 000000000..c5ad7528a --- /dev/null +++ b/providers/llmgateway/models/deepseek/deepseek-r1-0528.toml @@ -0,0 +1,22 @@ +name = "DeepSeek R1 (0528)" +family = "deepseek" +release_date = "2025-05-28" +last_updated = "2025-05-28" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true +status = "beta" + +[cost] +input = 0.25 +output = 1.00 + +[limit] +context = 32_770 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/deepseek/deepseek-r1t2-chimera-free.toml b/providers/llmgateway/models/deepseek/deepseek-r1t2-chimera-free.toml new file mode 100644 index 000000000..a3acc1c18 --- /dev/null +++ b/providers/llmgateway/models/deepseek/deepseek-r1t2-chimera-free.toml @@ -0,0 +1,21 @@ +name = "DeepSeek R1T2 Chimera (Free)" +family = "deepseek" +release_date = "2025-07-08" +last_updated = "2025-07-08" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.00 +output = 
0.00 + +[limit] +context = 163_840 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/deepseek/deepseek-v3.1.toml b/providers/llmgateway/models/deepseek/deepseek-v3.1.toml new file mode 100644 index 000000000..931c90e48 --- /dev/null +++ b/providers/llmgateway/models/deepseek/deepseek-v3.1.toml @@ -0,0 +1,23 @@ +name = "DeepSeek V3.1" +family = "deepseek" +release_date = "2025-08-21" +last_updated = "2025-08-21" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = false +open_weights = true + +[cost] +input = 0.56 +output = 1.68 +cache_read = 0.11 + +[limit] +context = 128_000 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/deepseek/deepseek-v3.2.toml b/providers/llmgateway/models/deepseek/deepseek-v3.2.toml new file mode 100644 index 000000000..7621f7616 --- /dev/null +++ b/providers/llmgateway/models/deepseek/deepseek-v3.2.toml @@ -0,0 +1,22 @@ +name = "DeepSeek V3.2" +family = "deepseek" +release_date = "2025-09-29" +last_updated = "2025-09-29" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.28 +output = 0.42 +cache_read = 0.03 + +[limit] +context = 163_840 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/deepseek/deepseek-v3.toml b/providers/llmgateway/models/deepseek/deepseek-v3.toml new file mode 100644 index 000000000..a8205555b --- /dev/null +++ b/providers/llmgateway/models/deepseek/deepseek-v3.toml @@ -0,0 +1,21 @@ +name = "DeepSeek V3" +family = "deepseek" +release_date = "2024-12-26" +last_updated = "2024-12-26" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.15 +output = 0.40 + 
+[limit] +context = 163_840 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemini-2.0-flash-lite.toml b/providers/llmgateway/models/google/gemini-2.0-flash-lite.toml new file mode 100644 index 000000000..ec66df596 --- /dev/null +++ b/providers/llmgateway/models/google/gemini-2.0-flash-lite.toml @@ -0,0 +1,21 @@ +name = "Gemini 2.0 Flash Lite" +family = "gemini" +release_date = "2025-02-25" +last_updated = "2025-02-25" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.08 +output = 0.30 + +[limit] +context = 1_000_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemini-2.0-flash.toml b/providers/llmgateway/models/google/gemini-2.0-flash.toml new file mode 100644 index 000000000..13813e688 --- /dev/null +++ b/providers/llmgateway/models/google/gemini-2.0-flash.toml @@ -0,0 +1,21 @@ +name = "Gemini 2.0 Flash" +family = "gemini" +release_date = "2025-02-05" +last_updated = "2025-02-05" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.10 +output = 0.40 + +[limit] +context = 1_000_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemini-2.5-flash-image-preview.toml b/providers/llmgateway/models/google/gemini-2.5-flash-image-preview.toml new file mode 100644 index 000000000..25d594d3a --- /dev/null +++ b/providers/llmgateway/models/google/gemini-2.5-flash-image-preview.toml @@ -0,0 +1,22 @@ +name = "Gemini 2.5 Flash Image (Preview)" +family = "gemini" +release_date = "2025-10-02" +last_updated = "2025-10-02" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = false + 
+[cost] +input = 0.30 +output = 30.00 + +[limit] +context = 32_800 +output = 8_200 + +[modalities] +input = ["text", "image"] +output = ["text", "image"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemini-2.5-flash-image.toml b/providers/llmgateway/models/google/gemini-2.5-flash-image.toml new file mode 100644 index 000000000..463827600 --- /dev/null +++ b/providers/llmgateway/models/google/gemini-2.5-flash-image.toml @@ -0,0 +1,22 @@ +name = "Gemini 2.5 Flash Image" +family = "gemini" +release_date = "2025-10-02" +last_updated = "2025-10-02" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = false + +[cost] +input = 0.30 +output = 30.00 + +[limit] +context = 32_800 +output = 8_200 + +[modalities] +input = ["text", "image"] +output = ["text", "image"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemini-2.5-flash-lite-preview-09-2025.toml b/providers/llmgateway/models/google/gemini-2.5-flash-lite-preview-09-2025.toml new file mode 100644 index 000000000..3be518566 --- /dev/null +++ b/providers/llmgateway/models/google/gemini-2.5-flash-lite-preview-09-2025.toml @@ -0,0 +1,22 @@ +name = "Gemini 2.5 Flash Lite Preview (09-2025)" +family = "gemini" +release_date = "2025-09-25" +last_updated = "2025-09-25" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.10 +output = 0.40 +cache_read = 0.03 + +[limit] +context = 1_000_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemini-2.5-flash-lite.toml b/providers/llmgateway/models/google/gemini-2.5-flash-lite.toml new file mode 100644 index 000000000..f2f36a655 --- /dev/null +++ b/providers/llmgateway/models/google/gemini-2.5-flash-lite.toml @@ -0,0 +1,22 @@ +name = "Gemini 2.5 Flash Lite" +family = "gemini" 
+release_date = "2025-07-22" +last_updated = "2025-07-22" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.10 +output = 0.40 +cache_read = 0.03 + +[limit] +context = 1_000_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemini-2.5-flash-preview-09-2025.toml b/providers/llmgateway/models/google/gemini-2.5-flash-preview-09-2025.toml new file mode 100644 index 000000000..016e176f4 --- /dev/null +++ b/providers/llmgateway/models/google/gemini-2.5-flash-preview-09-2025.toml @@ -0,0 +1,22 @@ +name = "Gemini 2.5 Flash Preview (09-2025)" +family = "gemini" +release_date = "2025-09-25" +last_updated = "2025-09-25" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.30 +output = 2.50 +cache_read = 0.08 + +[limit] +context = 1_000_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemini-2.5-flash.toml b/providers/llmgateway/models/google/gemini-2.5-flash.toml new file mode 100644 index 000000000..e554e4953 --- /dev/null +++ b/providers/llmgateway/models/google/gemini-2.5-flash.toml @@ -0,0 +1,22 @@ +name = "Gemini 2.5 Flash" +family = "gemini" +release_date = "2025-08-26" +last_updated = "2025-08-26" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.30 +output = 2.50 +cache_read = 0.08 + +[limit] +context = 1_000_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemini-2.5-pro.toml b/providers/llmgateway/models/google/gemini-2.5-pro.toml new file mode 100644 index 000000000..8b5822ce6 --- /dev/null +++ 
b/providers/llmgateway/models/google/gemini-2.5-pro.toml @@ -0,0 +1,21 @@ +name = "Gemini 2.5 Pro" +family = "gemini" +release_date = "2025-03-25" +last_updated = "2025-03-25" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 1.25 +output = 10.00 + +[limit] +context = 1_000_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemini-3-flash-preview.toml b/providers/llmgateway/models/google/gemini-3-flash-preview.toml new file mode 100644 index 000000000..8aae94d8a --- /dev/null +++ b/providers/llmgateway/models/google/gemini-3-flash-preview.toml @@ -0,0 +1,22 @@ +name = "Gemini 3 Flash (Preview)" +family = "gemini" +release_date = "2025-12-17" +last_updated = "2025-12-17" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.50 +output = 3.00 + +[limit] +context = 1_000_000 +output = 65_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemini-3-pro-image-preview.toml b/providers/llmgateway/models/google/gemini-3-pro-image-preview.toml new file mode 100644 index 000000000..2a3b2ee0e --- /dev/null +++ b/providers/llmgateway/models/google/gemini-3-pro-image-preview.toml @@ -0,0 +1,22 @@ +name = "Gemini 3 Pro Image (Preview)" +family = "gemini" +release_date = "2025-11-20" +last_updated = "2025-11-20" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = false + +[cost] +input = 2.00 +output = 12.00 + +[limit] +context = 98_304 +output = 32_768 + +[modalities] +input = ["text", "image"] +output = ["text", "image"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemini-3-pro-preview.toml 
b/providers/llmgateway/models/google/gemini-3-pro-preview.toml new file mode 100644 index 000000000..498444399 --- /dev/null +++ b/providers/llmgateway/models/google/gemini-3-pro-preview.toml @@ -0,0 +1,22 @@ +name = "Gemini 3 Pro (Preview)" +family = "gemini" +release_date = "2025-11-18" +last_updated = "2025-11-18" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 2.00 +output = 12.00 + +[limit] +context = 1_000_000 +output = 65_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemma-2-27b-it-together.toml b/providers/llmgateway/models/google/gemma-2-27b-it-together.toml new file mode 100644 index 000000000..3fca28b14 --- /dev/null +++ b/providers/llmgateway/models/google/gemma-2-27b-it-together.toml @@ -0,0 +1,21 @@ +name = "Gemma 2 27B IT" +family = "gemini" +release_date = "2024-06-27" +last_updated = "2024-06-27" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.08 +output = 0.08 + +[limit] +context = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemma-3-12b-it.toml b/providers/llmgateway/models/google/gemma-3-12b-it.toml new file mode 100644 index 000000000..11359a07d --- /dev/null +++ b/providers/llmgateway/models/google/gemma-3-12b-it.toml @@ -0,0 +1,21 @@ +name = "Gemma 3 12B IT" +family = "gemini" +release_date = "2025-03-10" +last_updated = "2025-03-10" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.08 +output = 0.30 + +[limit] +context = 1_000_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git 
a/providers/llmgateway/models/google/gemma-3-1b-it.toml b/providers/llmgateway/models/google/gemma-3-1b-it.toml new file mode 100644 index 000000000..f24d5f4af --- /dev/null +++ b/providers/llmgateway/models/google/gemma-3-1b-it.toml @@ -0,0 +1,21 @@ +name = "Gemma 3 1B IT" +family = "gemini" +release_date = "2025-03-12" +last_updated = "2025-03-12" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.08 +output = 0.30 + +[limit] +context = 1_000_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemma-3-27b.toml b/providers/llmgateway/models/google/gemma-3-27b.toml new file mode 100644 index 000000000..f985d5c43 --- /dev/null +++ b/providers/llmgateway/models/google/gemma-3-27b.toml @@ -0,0 +1,21 @@ +name = "Gemma 3 27B" +family = "gemini" +release_date = "2025-03-12" +last_updated = "2025-03-12" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.27 +output = 0.27 + +[limit] +context = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemma-3-4b-it.toml b/providers/llmgateway/models/google/gemma-3-4b-it.toml new file mode 100644 index 000000000..aad27de8c --- /dev/null +++ b/providers/llmgateway/models/google/gemma-3-4b-it.toml @@ -0,0 +1,21 @@ +name = "Gemma 3 4B IT" +family = "gemini" +release_date = "2025-03-10" +last_updated = "2025-03-10" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.08 +output = 0.30 + +[limit] +context = 1_000_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemma-3n-e2b-it.toml 
b/providers/llmgateway/models/google/gemma-3n-e2b-it.toml new file mode 100644 index 000000000..39b1c0cfd --- /dev/null +++ b/providers/llmgateway/models/google/gemma-3n-e2b-it.toml @@ -0,0 +1,21 @@ +name = "Gemma 3n E2B IT" +family = "gemini" +release_date = "2025-06-26" +last_updated = "2025-06-26" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.08 +output = 0.30 + +[limit] +context = 1_000_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/google/gemma-3n-e4b-it.toml b/providers/llmgateway/models/google/gemma-3n-e4b-it.toml new file mode 100644 index 000000000..338f81bb9 --- /dev/null +++ b/providers/llmgateway/models/google/gemma-3n-e4b-it.toml @@ -0,0 +1,21 @@ +name = "Gemma 3n E4B IT" +family = "gemini" +release_date = "2025-06-26" +last_updated = "2025-06-26" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.08 +output = 0.30 + +[limit] +context = 1_000_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/llmgateway/auto.toml b/providers/llmgateway/models/llmgateway/auto.toml new file mode 100644 index 000000000..2b97f2d94 --- /dev/null +++ b/providers/llmgateway/models/llmgateway/auto.toml @@ -0,0 +1,21 @@ +name = "Auto Route" +family = "llmgateway" +release_date = "2024-01-01" +last_updated = "2024-01-01" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/llmgateway/custom.toml b/providers/llmgateway/models/llmgateway/custom.toml new file mode 100644 
index 000000000..704724161 --- /dev/null +++ b/providers/llmgateway/models/llmgateway/custom.toml @@ -0,0 +1,21 @@ +name = "Custom Model" +family = "llmgateway" +release_date = "2024-01-01" +last_updated = "2024-01-01" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/meta/llama-3.1-70b-instruct.toml b/providers/llmgateway/models/meta/llama-3.1-70b-instruct.toml new file mode 100644 index 000000000..915daceeb --- /dev/null +++ b/providers/llmgateway/models/meta/llama-3.1-70b-instruct.toml @@ -0,0 +1,23 @@ +name = "Llama 3.1 70B Instruct" +family = "llama" +release_date = "2024-07-23" +last_updated = "2024-07-23" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true +status = "beta" + +[cost] +input = 0.72 +output = 0.72 + +[limit] +context = 128_000 +output = 2_048 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/meta/llama-3.1-8b-instruct.toml b/providers/llmgateway/models/meta/llama-3.1-8b-instruct.toml new file mode 100644 index 000000000..b2c2cbe0e --- /dev/null +++ b/providers/llmgateway/models/meta/llama-3.1-8b-instruct.toml @@ -0,0 +1,23 @@ +name = "Llama 3.1 8B Instruct" +family = "llama" +release_date = "2024-07-23" +last_updated = "2024-07-23" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true +status = "beta" + +[cost] +input = 0.22 +output = 0.22 + +[limit] +context = 128_000 +output = 2_048 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/meta/llama-3.1-nemotron-ultra-253b.toml 
b/providers/llmgateway/models/meta/llama-3.1-nemotron-ultra-253b.toml new file mode 100644 index 000000000..aad971910 --- /dev/null +++ b/providers/llmgateway/models/meta/llama-3.1-nemotron-ultra-253b.toml @@ -0,0 +1,21 @@ +name = "Llama 3.1 Nemotron Ultra 253B" +family = "llama" +release_date = "2025-04-07" +last_updated = "2025-04-07" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.60 +output = 1.80 + +[limit] +context = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/meta/llama-3.2-11b-instruct.toml b/providers/llmgateway/models/meta/llama-3.2-11b-instruct.toml new file mode 100644 index 000000000..9956a2ee2 --- /dev/null +++ b/providers/llmgateway/models/meta/llama-3.2-11b-instruct.toml @@ -0,0 +1,22 @@ +name = "Llama 3.2 11B Instruct" +family = "llama" +release_date = "2024-09-25" +last_updated = "2024-09-25" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true +status = "beta" + +[cost] +input = 0.07 +output = 0.33 + +[limit] +context = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/meta/llama-3.3-70b-instruct-free.toml b/providers/llmgateway/models/meta/llama-3.3-70b-instruct-free.toml new file mode 100644 index 000000000..67cc88ec0 --- /dev/null +++ b/providers/llmgateway/models/meta/llama-3.3-70b-instruct-free.toml @@ -0,0 +1,21 @@ +name = "Meta Llama 3.3 70B Instruct (Free)" +family = "llama" +release_date = "2024-12-06" +last_updated = "2024-12-06" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 131_072 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff 
--git a/providers/llmgateway/models/meta/llama-3.3-70b-instruct.toml b/providers/llmgateway/models/meta/llama-3.3-70b-instruct.toml new file mode 100644 index 000000000..b298b41f0 --- /dev/null +++ b/providers/llmgateway/models/meta/llama-3.3-70b-instruct.toml @@ -0,0 +1,21 @@ +name = "Llama 3.3 70B Instruct" +family = "llama" +release_date = "2024-12-06" +last_updated = "2024-12-06" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.13 +output = 0.40 + +[limit] +context = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/meta/llama-4-maverick-17b-instruct.toml b/providers/llmgateway/models/meta/llama-4-maverick-17b-instruct.toml new file mode 100644 index 000000000..b4d26ec55 --- /dev/null +++ b/providers/llmgateway/models/meta/llama-4-maverick-17b-instruct.toml @@ -0,0 +1,23 @@ +name = "Llama 4 Maverick 17B Instruct" +family = "llama" +release_date = "2025-04-05" +last_updated = "2025-04-05" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true +status = "beta" + +[cost] +input = 0.24 +output = 0.97 + +[limit] +context = 8_192 +output = 2_048 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/meta/llama-4-maverick-free.toml b/providers/llmgateway/models/meta/llama-4-maverick-free.toml new file mode 100644 index 000000000..7aa7b2935 --- /dev/null +++ b/providers/llmgateway/models/meta/llama-4-maverick-free.toml @@ -0,0 +1,21 @@ +name = "Meta Llama 4 Maverick (Free)" +family = "llama" +release_date = "2025-04-05" +last_updated = "2025-04-05" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 1_000_000 + 
+[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/meta/llama-4-scout-17b-instruct.toml b/providers/llmgateway/models/meta/llama-4-scout-17b-instruct.toml new file mode 100644 index 000000000..9490f4215 --- /dev/null +++ b/providers/llmgateway/models/meta/llama-4-scout-17b-instruct.toml @@ -0,0 +1,23 @@ +name = "Llama 4 Scout 17B Instruct" +family = "llama" +release_date = "2025-04-05" +last_updated = "2025-04-05" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true +status = "beta" + +[cost] +input = 0.17 +output = 0.66 + +[limit] +context = 8_192 +output = 2_048 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/meta/llama-4-scout-free.toml b/providers/llmgateway/models/meta/llama-4-scout-free.toml new file mode 100644 index 000000000..b2ae4a8b2 --- /dev/null +++ b/providers/llmgateway/models/meta/llama-4-scout-free.toml @@ -0,0 +1,21 @@ +name = "Meta Llama 4 Scout (Free)" +family = "llama" +release_date = "2025-04-05" +last_updated = "2025-04-05" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 1_000_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/meta/llama-4-scout.toml b/providers/llmgateway/models/meta/llama-4-scout.toml new file mode 100644 index 000000000..256aa0138 --- /dev/null +++ b/providers/llmgateway/models/meta/llama-4-scout.toml @@ -0,0 +1,22 @@ +name = "Llama 4 Scout" +family = "llama" +release_date = "2025-04-05" +last_updated = "2025-04-05" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = false +open_weights = true +status = "beta" + +[cost] +input = 0.18 +output = 0.59 
+ +[limit] +context = 32_768 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/meta/llama-guard-4-12b.toml b/providers/llmgateway/models/meta/llama-guard-4-12b.toml new file mode 100644 index 000000000..1d820fd0d --- /dev/null +++ b/providers/llmgateway/models/meta/llama-guard-4-12b.toml @@ -0,0 +1,21 @@ +name = "Llama Guard 4 12B" +family = "llama" +release_date = "2025-04-30" +last_updated = "2025-04-30" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.20 +output = 0.20 + +[limit] +context = 131_072 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/minimax/minimax-m2.1.toml b/providers/llmgateway/models/minimax/minimax-m2.1.toml new file mode 100644 index 000000000..17b6e62fe --- /dev/null +++ b/providers/llmgateway/models/minimax/minimax-m2.1.toml @@ -0,0 +1,23 @@ +name = "MiniMax M2.1" +family = "minimax" +release_date = "2025-12-23" +last_updated = "2025-12-23" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.30 +output = 1.20 +cache_read = 0.03 + +[limit] +context = 204_800 +output = 131_072 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/mistral/mistral-large-latest.toml b/providers/llmgateway/models/mistral/mistral-large-latest.toml new file mode 100644 index 000000000..ea18276b1 --- /dev/null +++ b/providers/llmgateway/models/mistral/mistral-large-latest.toml @@ -0,0 +1,21 @@ +name = "Mistral Large Latest" +family = "mistral" +release_date = "2025-12-02" +last_updated = "2025-12-02" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 4.00 +output = 12.00 + 
+[limit] +context = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/mistral/mixtral-8x7b-instruct-together.toml b/providers/llmgateway/models/mistral/mixtral-8x7b-instruct-together.toml new file mode 100644 index 000000000..d078931b8 --- /dev/null +++ b/providers/llmgateway/models/mistral/mixtral-8x7b-instruct-together.toml @@ -0,0 +1,21 @@ +name = "Mixtral 8x7B Instruct" +family = "mistral" +release_date = "2023-12-10" +last_updated = "2023-12-10" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.06 +output = 0.06 + +[limit] +context = 32_768 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/mistral/pixtral-large-latest.toml b/providers/llmgateway/models/mistral/pixtral-large-latest.toml new file mode 100644 index 000000000..f56e355b8 --- /dev/null +++ b/providers/llmgateway/models/mistral/pixtral-large-latest.toml @@ -0,0 +1,21 @@ +name = "Pixtral Large Latest" +family = "mistral" +release_date = "2024-11-18" +last_updated = "2024-11-18" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 4.00 +output = 12.00 + +[limit] +context = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/moonshot/kimi-k2-0905-free.toml b/providers/llmgateway/models/moonshot/kimi-k2-0905-free.toml new file mode 100644 index 000000000..e386f653f --- /dev/null +++ b/providers/llmgateway/models/moonshot/kimi-k2-0905-free.toml @@ -0,0 +1,21 @@ +name = "Kimi Dev 0905 (Free)" +family = "kimi" +release_date = "2025-09-05" +last_updated = "2025-09-05" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = 
false + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 131_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/moonshot/kimi-k2-thinking-turbo.toml b/providers/llmgateway/models/moonshot/kimi-k2-thinking-turbo.toml new file mode 100644 index 000000000..89bf1d152 --- /dev/null +++ b/providers/llmgateway/models/moonshot/kimi-k2-thinking-turbo.toml @@ -0,0 +1,23 @@ +name = "Kimi K2 Thinking Turbo" +family = "moonshot" +release_date = "2025-11-06" +last_updated = "2025-11-06" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 1.15 +output = 8.00 +cache_read = 0.15 + +[limit] +context = 262_144 +output = 262_144 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/moonshot/kimi-k2-thinking.toml b/providers/llmgateway/models/moonshot/kimi-k2-thinking.toml new file mode 100644 index 000000000..fad4b66e4 --- /dev/null +++ b/providers/llmgateway/models/moonshot/kimi-k2-thinking.toml @@ -0,0 +1,23 @@ +name = "Kimi K2 Thinking" +family = "moonshot" +release_date = "2025-11-06" +last_updated = "2025-11-06" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.60 +output = 2.50 +cache_read = 0.15 + +[limit] +context = 262_144 +output = 262_144 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/moonshot/kimi-k2.toml b/providers/llmgateway/models/moonshot/kimi-k2.toml new file mode 100644 index 000000000..8ee8fbdc1 --- /dev/null +++ b/providers/llmgateway/models/moonshot/kimi-k2.toml @@ -0,0 +1,23 @@ +name = "Kimi K2" +family = "moonshot" +release_date = "2025-07-11" +last_updated = "2025-07-11" +attachment = false +reasoning = false +temperature = true +tool_call = true 
+structured_output = true +open_weights = false + +[cost] +input = 1.00 +output = 3.00 +cache_read = 0.50 + +[limit] +context = 131_072 +output = 16_384 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/nvidia/nemotron-nano-9b-v2.toml b/providers/llmgateway/models/nvidia/nemotron-nano-9b-v2.toml new file mode 100644 index 000000000..020437c46 --- /dev/null +++ b/providers/llmgateway/models/nvidia/nemotron-nano-9b-v2.toml @@ -0,0 +1,21 @@ +name = "Nemotron Nano 9B V2 (Free)" +family = "nvidia" +release_date = "2025-08-18" +last_updated = "2025-08-18" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = false + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-3.5-turbo.toml b/providers/llmgateway/models/openai/gpt-3.5-turbo.toml new file mode 100644 index 000000000..687b10243 --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-3.5-turbo.toml @@ -0,0 +1,21 @@ +name = "GPT-3.5 Turbo" +family = "gpt" +release_date = "2022-11-30" +last_updated = "2022-11-30" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.50 +output = 1.50 + +[limit] +context = 16_385 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-4-turbo.toml b/providers/llmgateway/models/openai/gpt-4-turbo.toml new file mode 100644 index 000000000..3d8e0a676 --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-4-turbo.toml @@ -0,0 +1,21 @@ +name = "GPT-4 Turbo" +family = "gpt" +release_date = "2023-11-06" +last_updated = "2023-11-06" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true 
+open_weights = false + +[cost] +input = 10.00 +output = 30.00 + +[limit] +context = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-4.1-mini.toml b/providers/llmgateway/models/openai/gpt-4.1-mini.toml new file mode 100644 index 000000000..0d4a5028e --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-4.1-mini.toml @@ -0,0 +1,21 @@ +name = "GPT-4.1 Mini" +family = "gpt" +release_date = "2025-04-14" +last_updated = "2025-04-14" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.40 +output = 1.60 + +[limit] +context = 1_000_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-4.1-nano.toml b/providers/llmgateway/models/openai/gpt-4.1-nano.toml new file mode 100644 index 000000000..5fd989c10 --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-4.1-nano.toml @@ -0,0 +1,21 @@ +name = "GPT-4.1 Nano" +family = "gpt" +release_date = "2025-04-14" +last_updated = "2025-04-14" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.10 +output = 0.40 + +[limit] +context = 1_000_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-4.1.toml b/providers/llmgateway/models/openai/gpt-4.1.toml new file mode 100644 index 000000000..9da5b49b1 --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-4.1.toml @@ -0,0 +1,21 @@ +name = "GPT-4.1" +family = "gpt" +release_date = "2025-04-14" +last_updated = "2025-04-14" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 2.00 +output = 8.00 + +[limit] +context = 1_000_000 + 
+[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-4.toml b/providers/llmgateway/models/openai/gpt-4.toml new file mode 100644 index 000000000..c54180af8 --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-4.toml @@ -0,0 +1,22 @@ +name = "GPT-4" +family = "gpt" +release_date = "2023-03-14" +last_updated = "2023-03-14" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = false +open_weights = false + +[cost] +input = 30.00 +output = 60.00 + +[limit] +context = 8_192 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-4o-mini-search-preview.toml b/providers/llmgateway/models/openai/gpt-4o-mini-search-preview.toml new file mode 100644 index 000000000..82d810fdd --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-4o-mini-search-preview.toml @@ -0,0 +1,22 @@ +name = "GPT-4o Mini Search Preview" +family = "gpt" +release_date = "2024-10-01" +last_updated = "2024-10-01" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = false + +[cost] +input = 0.15 +output = 0.60 + +[limit] +context = 128_000 +output = 16_384 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-4o-mini.toml b/providers/llmgateway/models/openai/gpt-4o-mini.toml new file mode 100644 index 000000000..a4a199b1e --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-4o-mini.toml @@ -0,0 +1,23 @@ +name = "GPT-4o Mini" +family = "gpt" +release_date = "2024-07-18" +last_updated = "2024-07-18" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.15 +output = 0.60 +cache_read = 0.08 + +[limit] +context = 128_000 +output = 
16_384 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-4o-search-preview.toml b/providers/llmgateway/models/openai/gpt-4o-search-preview.toml new file mode 100644 index 000000000..45efd2f55 --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-4o-search-preview.toml @@ -0,0 +1,22 @@ +name = "GPT-4o Search Preview" +family = "gpt" +release_date = "2024-10-01" +last_updated = "2024-10-01" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = false + +[cost] +input = 2.50 +output = 10.00 + +[limit] +context = 128_000 +output = 16_384 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-4o.toml b/providers/llmgateway/models/openai/gpt-4o.toml new file mode 100644 index 000000000..8ccca0582 --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-4o.toml @@ -0,0 +1,23 @@ +name = "GPT-4o" +family = "gpt" +release_date = "2024-05-13" +last_updated = "2024-05-13" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 2.50 +output = 10.00 +cache_read = 1.25 + +[limit] +context = 128_000 +output = 16_384 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-5-chat-latest.toml b/providers/llmgateway/models/openai/gpt-5-chat-latest.toml new file mode 100644 index 000000000..f2ff52f9d --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-5-chat-latest.toml @@ -0,0 +1,23 @@ +name = "GPT-5 Chat Latest" +family = "gpt" +release_date = "2025-08-01" +last_updated = "2025-08-01" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = false + +[cost] +input = 1.25 +output = 10.00 +cache_read = 0.13 + 
+[limit] +context = 400_000 +output = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-5-mini.toml b/providers/llmgateway/models/openai/gpt-5-mini.toml new file mode 100644 index 000000000..1926ccb79 --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-5-mini.toml @@ -0,0 +1,23 @@ +name = "GPT-5 Mini" +family = "gpt" +release_date = "2025-08-01" +last_updated = "2025-08-01" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.25 +output = 2.00 +cache_read = 0.03 + +[limit] +context = 400_000 +output = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-5-nano.toml b/providers/llmgateway/models/openai/gpt-5-nano.toml new file mode 100644 index 000000000..905e7d7c2 --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-5-nano.toml @@ -0,0 +1,23 @@ +name = "GPT-5 Nano" +family = "gpt" +release_date = "2025-08-01" +last_updated = "2025-08-01" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.05 +output = 0.40 +cache_read = 0.01 + +[limit] +context = 400_000 +output = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-5-pro.toml b/providers/llmgateway/models/openai/gpt-5-pro.toml new file mode 100644 index 000000000..0bdcec99a --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-5-pro.toml @@ -0,0 +1,22 @@ +name = "GPT-5 Pro" +family = "gpt" +release_date = "2025-08-01" +last_updated = "2025-08-01" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 15.00 +output = 120.00 + +[limit] +context = 
400_000 +output = 272_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-5.1-codex-mini.toml b/providers/llmgateway/models/openai/gpt-5.1-codex-mini.toml new file mode 100644 index 000000000..6bad6ac25 --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-5.1-codex-mini.toml @@ -0,0 +1,23 @@ +name = "GPT-5.1 Codex mini" +family = "gpt" +release_date = "2025-11-12" +last_updated = "2025-11-12" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.25 +output = 2.00 +cache_read = 0.03 + +[limit] +context = 400_000 +output = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-5.1-codex.toml b/providers/llmgateway/models/openai/gpt-5.1-codex.toml new file mode 100644 index 000000000..af38bff5d --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-5.1-codex.toml @@ -0,0 +1,22 @@ +name = "GPT-5.1 Codex" +family = "gpt" +release_date = "2025-11-13" +last_updated = "2025-11-13" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 1.25 +output = 10.00 + +[limit] +context = 400_000 +output = 272_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-5.1.toml b/providers/llmgateway/models/openai/gpt-5.1.toml new file mode 100644 index 000000000..1581dc2a2 --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-5.1.toml @@ -0,0 +1,23 @@ +name = "GPT-5.1" +family = "gpt" +release_date = "2025-11-01" +last_updated = "2025-11-01" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 1.25 +output = 10.00 +cache_read = 0.13 + 
+[limit] +context = 400_000 +output = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-5.2-chat-latest.toml b/providers/llmgateway/models/openai/gpt-5.2-chat-latest.toml new file mode 100644 index 000000000..f31092eab --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-5.2-chat-latest.toml @@ -0,0 +1,23 @@ +name = "GPT-5.2 Chat" +family = "gpt" +release_date = "2025-12-11" +last_updated = "2025-12-11" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = false +open_weights = false + +[cost] +input = 1.75 +output = 14.00 +cache_read = 0.18 + +[limit] +context = 128_000 +output = 16_400 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-5.2-pro.toml b/providers/llmgateway/models/openai/gpt-5.2-pro.toml new file mode 100644 index 000000000..420230374 --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-5.2-pro.toml @@ -0,0 +1,22 @@ +name = "GPT-5.2 Pro" +family = "gpt" +release_date = "2025-12-11" +last_updated = "2025-12-11" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 21.00 +output = 168.00 + +[limit] +context = 400_000 +output = 272_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-5.2.toml b/providers/llmgateway/models/openai/gpt-5.2.toml new file mode 100644 index 000000000..fd6a2a43b --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-5.2.toml @@ -0,0 +1,23 @@ +name = "GPT-5.2" +family = "gpt" +release_date = "2025-12-11" +last_updated = "2025-12-11" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 1.75 +output = 14.00 +cache_read 
= 0.18 + +[limit] +context = 400_000 +output = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-5.toml b/providers/llmgateway/models/openai/gpt-5.toml new file mode 100644 index 000000000..5c86e3140 --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-5.toml @@ -0,0 +1,23 @@ +name = "GPT-5" +family = "gpt" +release_date = "2025-08-01" +last_updated = "2025-08-01" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 1.25 +output = 10.00 +cache_read = 0.13 + +[limit] +context = 400_000 +output = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-oss-120b.toml b/providers/llmgateway/models/openai/gpt-oss-120b.toml new file mode 100644 index 000000000..422a24553 --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-oss-120b.toml @@ -0,0 +1,22 @@ +name = "GPT OSS 120B" +family = "gpt" +release_date = "2025-08-05" +last_updated = "2025-08-05" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.15 +output = 0.75 + +[limit] +context = 131_072 +output = 32_766 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-oss-20b-free.toml b/providers/llmgateway/models/openai/gpt-oss-20b-free.toml new file mode 100644 index 000000000..a7e17f57a --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-oss-20b-free.toml @@ -0,0 +1,21 @@ +name = "GPT OSS 20B (Free)" +family = "gpt-oss" +release_date = "2025-08-05" +last_updated = "2025-08-05" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = false + +[cost] +input = 0.00 +output = 0.00 + +[limit] 
+context = 131_072 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/gpt-oss-20b.toml b/providers/llmgateway/models/openai/gpt-oss-20b.toml new file mode 100644 index 000000000..ee5983c6e --- /dev/null +++ b/providers/llmgateway/models/openai/gpt-oss-20b.toml @@ -0,0 +1,22 @@ +name = "GPT OSS 20B" +family = "gpt" +release_date = "2025-08-05" +last_updated = "2025-08-05" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.10 +output = 0.50 + +[limit] +context = 131_072 +output = 32_766 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/o1-mini.toml b/providers/llmgateway/models/openai/o1-mini.toml new file mode 100644 index 000000000..6e5858e7a --- /dev/null +++ b/providers/llmgateway/models/openai/o1-mini.toml @@ -0,0 +1,22 @@ +name = "o1 Mini" +family = "gpt" +release_date = "2024-09-12" +last_updated = "2024-09-12" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = false +status = "beta" + +[cost] +input = 1.10 +output = 4.40 + +[limit] +context = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/o1.toml b/providers/llmgateway/models/openai/o1.toml new file mode 100644 index 000000000..fdcc29e57 --- /dev/null +++ b/providers/llmgateway/models/openai/o1.toml @@ -0,0 +1,21 @@ +name = "o1" +family = "gpt" +release_date = "2024-09-12" +last_updated = "2024-09-12" +attachment = true +reasoning = true +temperature = true +tool_call = false +structured_output = true +open_weights = false + +[cost] +input = 15.00 +output = 60.00 + +[limit] +context = 200_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git 
a/providers/llmgateway/models/openai/o3-mini.toml b/providers/llmgateway/models/openai/o3-mini.toml new file mode 100644 index 000000000..4ac3fa9b5 --- /dev/null +++ b/providers/llmgateway/models/openai/o3-mini.toml @@ -0,0 +1,21 @@ +name = "o3 Mini" +family = "gpt" +release_date = "2025-06-01" +last_updated = "2025-06-01" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = false + +[cost] +input = 1.10 +output = 4.40 + +[limit] +context = 200_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/openai/o3.toml b/providers/llmgateway/models/openai/o3.toml new file mode 100644 index 000000000..bf81a3035 --- /dev/null +++ b/providers/llmgateway/models/openai/o3.toml @@ -0,0 +1,21 @@ +name = "o3" +family = "gpt" +release_date = "2025-06-01" +last_updated = "2025-06-01" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = false + +[cost] +input = 2.00 +output = 8.00 + +[limit] +context = 200_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/perplexity/sonar-pro.toml b/providers/llmgateway/models/perplexity/sonar-pro.toml new file mode 100644 index 000000000..80d05b4d1 --- /dev/null +++ b/providers/llmgateway/models/perplexity/sonar-pro.toml @@ -0,0 +1,21 @@ +name = "Sonar Pro" +family = "sonar" +release_date = "2025-03-07" +last_updated = "2025-03-07" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = false + +[cost] +input = 3.00 +output = 15.00 + +[limit] +context = 200_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/perplexity/sonar-reasoning-pro.toml b/providers/llmgateway/models/perplexity/sonar-reasoning-pro.toml new file mode 100644 
index 000000000..72f099ec5 --- /dev/null +++ b/providers/llmgateway/models/perplexity/sonar-reasoning-pro.toml @@ -0,0 +1,21 @@ +name = "Sonar Reasoning Pro" +family = "sonar" +release_date = "2025-03-07" +last_updated = "2025-03-07" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = false + +[cost] +input = 2.00 +output = 8.00 + +[limit] +context = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/perplexity/sonar.toml b/providers/llmgateway/models/perplexity/sonar.toml new file mode 100644 index 000000000..8a9b44c64 --- /dev/null +++ b/providers/llmgateway/models/perplexity/sonar.toml @@ -0,0 +1,21 @@ +name = "Sonar" +family = "sonar" +release_date = "2025-01-01" +last_updated = "2025-01-01" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = false + +[cost] +input = 1.00 +output = 1.00 + +[limit] +context = 130_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/xai/grok-3-mini.toml b/providers/llmgateway/models/xai/grok-3-mini.toml new file mode 100644 index 000000000..cce79b8b8 --- /dev/null +++ b/providers/llmgateway/models/xai/grok-3-mini.toml @@ -0,0 +1,21 @@ +name = "Grok-3 Mini" +family = "grok" +release_date = "2025-04-09" +last_updated = "2025-04-09" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.30 +output = 0.50 + +[limit] +context = 131_072 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/xai/grok-3.toml b/providers/llmgateway/models/xai/grok-3.toml new file mode 100644 index 000000000..fc9570b94 --- /dev/null +++ b/providers/llmgateway/models/xai/grok-3.toml @@ -0,0 +1,21 @@ +name = "Grok-3" 
+family = "grok" +release_date = "2025-02-17" +last_updated = "2025-02-17" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 3.00 +output = 15.00 + +[limit] +context = 131_072 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/xai/grok-4-0709.toml b/providers/llmgateway/models/xai/grok-4-0709.toml new file mode 100644 index 000000000..1c7dba3fc --- /dev/null +++ b/providers/llmgateway/models/xai/grok-4-0709.toml @@ -0,0 +1,22 @@ +name = "Grok 4 (0709)" +family = "grok" +release_date = "2025-07-09" +last_updated = "2025-07-09" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 3.00 +output = 15.00 + +[limit] +context = 256_000 +output = 256_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/xai/grok-4-1-fast-non-reasoning.toml b/providers/llmgateway/models/xai/grok-4-1-fast-non-reasoning.toml new file mode 100644 index 000000000..58dc2022d --- /dev/null +++ b/providers/llmgateway/models/xai/grok-4-1-fast-non-reasoning.toml @@ -0,0 +1,21 @@ +name = "Grok 4.1 Fast Non-Reasoning" +family = "grok" +release_date = "2025-11-19" +last_updated = "2025-11-19" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 3.00 +output = 15.00 + +[limit] +context = 2_000_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/xai/grok-4-1-fast-reasoning.toml b/providers/llmgateway/models/xai/grok-4-1-fast-reasoning.toml new file mode 100644 index 000000000..55d855599 --- /dev/null +++ b/providers/llmgateway/models/xai/grok-4-1-fast-reasoning.toml @@ -0,0 +1,21 @@ +name = "Grok 4.1 Fast 
Reasoning" +family = "grok" +release_date = "2025-11-19" +last_updated = "2025-11-19" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 3.00 +output = 15.00 + +[limit] +context = 2_000_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/xai/grok-4-fast-non-reasoning.toml b/providers/llmgateway/models/xai/grok-4-fast-non-reasoning.toml new file mode 100644 index 000000000..1dae5d1b0 --- /dev/null +++ b/providers/llmgateway/models/xai/grok-4-fast-non-reasoning.toml @@ -0,0 +1,22 @@ +name = "Grok 4 Fast Non-Reasoning" +family = "grok" +release_date = "2025-10-10" +last_updated = "2025-10-10" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.40 +output = 1.00 +cache_read = 0.05 + +[limit] +context = 2_000_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/xai/grok-4-fast-reasoning.toml b/providers/llmgateway/models/xai/grok-4-fast-reasoning.toml new file mode 100644 index 000000000..9b6b2c0dc --- /dev/null +++ b/providers/llmgateway/models/xai/grok-4-fast-reasoning.toml @@ -0,0 +1,22 @@ +name = "Grok 4 Fast Reasoning" +family = "grok" +release_date = "2025-07-09" +last_updated = "2025-07-09" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.40 +output = 1.00 +cache_read = 0.05 + +[limit] +context = 2_000_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/xai/grok-4.toml b/providers/llmgateway/models/xai/grok-4.toml new file mode 100644 index 000000000..e9904febf --- /dev/null +++ b/providers/llmgateway/models/xai/grok-4.toml @@ -0,0 +1,22 @@ 
+name = "Grok 4" +family = "grok" +release_date = "2025-07-09" +last_updated = "2025-07-09" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 3.00 +output = 15.00 + +[limit] +context = 256_000 +output = 256_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/xai/grok-code-fast-1.toml b/providers/llmgateway/models/xai/grok-code-fast-1.toml new file mode 100644 index 000000000..6428c94e9 --- /dev/null +++ b/providers/llmgateway/models/xai/grok-code-fast-1.toml @@ -0,0 +1,22 @@ +name = "Grok Code Fast 1" +family = "grok" +release_date = "2025-08-28" +last_updated = "2025-08-28" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.20 +output = 1.50 + +[limit] +context = 256_000 +output = 10_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/cogview-4.toml b/providers/llmgateway/models/zai/cogview-4.toml new file mode 100644 index 000000000..45b21ce82 --- /dev/null +++ b/providers/llmgateway/models/zai/cogview-4.toml @@ -0,0 +1,22 @@ +name = "CogView-4" +family = "zai" +release_date = "2025-03-04" +last_updated = "2025-03-04" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = false + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 2_000 +output = 4_096 + +[modalities] +input = ["text"] +output = ["text", "image"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-4-32b-0414-128k.toml b/providers/llmgateway/models/zai/glm-4-32b-0414-128k.toml new file mode 100644 index 000000000..10c00a8d5 --- /dev/null +++ b/providers/llmgateway/models/zai/glm-4-32b-0414-128k.toml @@ -0,0 +1,21 @@ +name = "GLM-4 32B (0414-128k)" +family = 
"glm" +release_date = "2025-04-14" +last_updated = "2025-04-14" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.10 +output = 0.10 + +[limit] +context = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-4.5-air-free.toml b/providers/llmgateway/models/zai/glm-4.5-air-free.toml new file mode 100644 index 000000000..3fdadfc97 --- /dev/null +++ b/providers/llmgateway/models/zai/glm-4.5-air-free.toml @@ -0,0 +1,21 @@ +name = "GLM-4.5 Air (Free)" +family = "glm" +release_date = "2025-07-25" +last_updated = "2025-07-25" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = false + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 131_072 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-4.5-air.toml b/providers/llmgateway/models/zai/glm-4.5-air.toml new file mode 100644 index 000000000..ad2807cd8 --- /dev/null +++ b/providers/llmgateway/models/zai/glm-4.5-air.toml @@ -0,0 +1,22 @@ +name = "GLM-4.5 Air" +family = "glm" +release_date = "2025-07-25" +last_updated = "2025-07-25" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.20 +output = 1.10 +cache_read = 0.03 + +[limit] +context = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-4.5-airx.toml b/providers/llmgateway/models/zai/glm-4.5-airx.toml new file mode 100644 index 000000000..9271836e0 --- /dev/null +++ b/providers/llmgateway/models/zai/glm-4.5-airx.toml @@ -0,0 +1,22 @@ +name = "GLM-4.5 AirX" +family = "glm" +release_date = "2025-07-28" +last_updated = "2025-07-28" +attachment = false +reasoning = 
false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 1.10 +output = 4.50 +cache_read = 0.22 + +[limit] +context = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-4.5-flash.toml b/providers/llmgateway/models/zai/glm-4.5-flash.toml new file mode 100644 index 000000000..c2a28d5f5 --- /dev/null +++ b/providers/llmgateway/models/zai/glm-4.5-flash.toml @@ -0,0 +1,21 @@ +name = "GLM-4.5 Flash" +family = "glm" +release_date = "2025-08-13" +last_updated = "2025-08-13" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-4.5-x.toml b/providers/llmgateway/models/zai/glm-4.5-x.toml new file mode 100644 index 000000000..fd3226bc4 --- /dev/null +++ b/providers/llmgateway/models/zai/glm-4.5-x.toml @@ -0,0 +1,23 @@ +name = "GLM-4.5 X" +family = "glm" +release_date = "2025-07-28" +last_updated = "2025-07-28" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false +status = "beta" + +[cost] +input = 2.20 +output = 8.90 +cache_read = 0.45 + +[limit] +context = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-4.5.toml b/providers/llmgateway/models/zai/glm-4.5.toml new file mode 100644 index 000000000..aa4e01188 --- /dev/null +++ b/providers/llmgateway/models/zai/glm-4.5.toml @@ -0,0 +1,22 @@ +name = "GLM-4.5" +family = "glm" +release_date = "2025-07-28" +last_updated = "2025-07-28" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input 
= 0.60 +output = 2.20 +cache_read = 0.11 + +[limit] +context = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-4.5v.toml b/providers/llmgateway/models/zai/glm-4.5v.toml new file mode 100644 index 000000000..a404f8abe --- /dev/null +++ b/providers/llmgateway/models/zai/glm-4.5v.toml @@ -0,0 +1,23 @@ +name = "GLM-4.5V" +family = "glm" +release_date = "2025-08-11" +last_updated = "2025-08-11" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.60 +output = 1.80 +cache_read = 0.11 + +[limit] +context = 128_000 +output = 16_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-4.6.toml b/providers/llmgateway/models/zai/glm-4.6.toml new file mode 100644 index 000000000..0019cbb11 --- /dev/null +++ b/providers/llmgateway/models/zai/glm-4.6.toml @@ -0,0 +1,22 @@ +name = "GLM-4.6" +family = "glm" +release_date = "2025-09-30" +last_updated = "2025-09-30" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.60 +output = 2.20 +cache_read = 0.11 + +[limit] +context = 200_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-4.6v-flash.toml b/providers/llmgateway/models/zai/glm-4.6v-flash.toml new file mode 100644 index 000000000..7fc75e7e6 --- /dev/null +++ b/providers/llmgateway/models/zai/glm-4.6v-flash.toml @@ -0,0 +1,22 @@ +name = "GLM-4.6V Flash" +family = "glm" +release_date = "2025-12-08" +last_updated = "2025-12-08" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 128_000 +output = 16_000 + 
+[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-4.6v-flashx.toml b/providers/llmgateway/models/zai/glm-4.6v-flashx.toml new file mode 100644 index 000000000..993b36242 --- /dev/null +++ b/providers/llmgateway/models/zai/glm-4.6v-flashx.toml @@ -0,0 +1,23 @@ +name = "GLM-4.6V FlashX" +family = "glm" +release_date = "2025-12-08" +last_updated = "2025-12-08" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.04 +output = 0.40 +cache_read = 0.00 + +[limit] +context = 128_000 +output = 16_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-4.6v.toml b/providers/llmgateway/models/zai/glm-4.6v.toml new file mode 100644 index 000000000..b13d5762d --- /dev/null +++ b/providers/llmgateway/models/zai/glm-4.6v.toml @@ -0,0 +1,23 @@ +name = "GLM-4.6V" +family = "glm" +release_date = "2025-12-08" +last_updated = "2025-12-08" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.30 +output = 0.90 +cache_read = 0.05 + +[limit] +context = 128_000 +output = 16_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-4.7-flash.toml b/providers/llmgateway/models/zai/glm-4.7-flash.toml new file mode 100644 index 000000000..c390fbb38 --- /dev/null +++ b/providers/llmgateway/models/zai/glm-4.7-flash.toml @@ -0,0 +1,22 @@ +name = "GLM-4.7 Flash" +family = "glm" +release_date = "2025-12-22" +last_updated = "2025-12-22" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 200_000 +output = 128_000 + +[modalities] +input 
= ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-4.7-flashx.toml b/providers/llmgateway/models/zai/glm-4.7-flashx.toml new file mode 100644 index 000000000..b1e5111ad --- /dev/null +++ b/providers/llmgateway/models/zai/glm-4.7-flashx.toml @@ -0,0 +1,23 @@ +name = "GLM-4.7 FlashX" +family = "glm" +release_date = "2025-12-22" +last_updated = "2025-12-22" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.07 +output = 0.40 +cache_read = 0.01 + +[limit] +context = 200_000 +output = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-4.7.toml b/providers/llmgateway/models/zai/glm-4.7.toml new file mode 100644 index 000000000..103e57c9a --- /dev/null +++ b/providers/llmgateway/models/zai/glm-4.7.toml @@ -0,0 +1,23 @@ +name = "GLM-4.7" +family = "glm" +release_date = "2025-12-22" +last_updated = "2025-12-22" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.60 +output = 2.20 +cache_read = 0.11 + +[limit] +context = 200_000 +output = 128_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/llmgateway/models/zai/glm-image.toml b/providers/llmgateway/models/zai/glm-image.toml new file mode 100644 index 000000000..43af1a0b5 --- /dev/null +++ b/providers/llmgateway/models/zai/glm-image.toml @@ -0,0 +1,22 @@ +name = "GLM-Image" +family = "glm" +release_date = "2025-01-14" +last_updated = "2025-01-14" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = false + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 2_000 +output = 4_096 + +[modalities] +input = ["text"] +output = ["text", "image"] \ No newline at end of file 
diff --git a/providers/llmgateway/provider.toml b/providers/llmgateway/provider.toml new file mode 100644 index 000000000..7f3a03eac --- /dev/null +++ b/providers/llmgateway/provider.toml @@ -0,0 +1,5 @@ +name = "LLM Gateway" +env = ["LLMGATEWAY_API_KEY"] +npm = "@ai-sdk/openai-compatible" +doc = "https://llmgateway.io/docs" +api = "https://api.llmgateway.io/v1" \ No newline at end of file diff --git a/providers/llmgateway/scripts/generate.ts b/providers/llmgateway/scripts/generate.ts new file mode 100644 index 000000000..b2018fcef --- /dev/null +++ b/providers/llmgateway/scripts/generate.ts @@ -0,0 +1,11 @@ +/** + * This script generates model TOML files from the LLM Gateway models package. + * + * Run from the llmgateway repository root: + * npx tsx scripts/export-models-dev.ts + * + * The script reads models from @llmgateway/models and generates TOML files + * organized by provider subdirectory. + */ + +// See: https://github.com/theopenco/llmgateway/blob/main/scripts/export-models-dev.ts From 24e575a86e56603afb57216af3ec59a9bd7abb5e Mon Sep 17 00:00:00 2001 From: Luca Steeb Date: Fri, 23 Jan 2026 01:15:27 +0000 Subject: [PATCH 2/8] refactor: flatten model structure to models/ directory Removes provider subdirectories, exports all models directly to models/ folder for simpler structure. 
Co-Authored-By: Claude Opus 4.5 --- providers/llmgateway/README.md | 14 ++------------ .../llmgateway/models/{llmgateway => }/auto.toml | 0 .../{anthropic => }/claude-3-5-haiku-20241022.toml | 0 .../models/{anthropic => }/claude-3-5-haiku.toml | 0 .../claude-3-5-sonnet-20240620.toml | 0 .../models/{anthropic => }/claude-3-5-sonnet.toml | 0 .../claude-3-7-sonnet-20250219.toml | 0 .../models/{anthropic => }/claude-3-7-sonnet.toml | 0 .../models/{anthropic => }/claude-3-haiku.toml | 0 .../models/{anthropic => }/claude-3-opus.toml | 0 .../{anthropic => }/claude-haiku-4-5-20251001.toml | 0 .../models/{anthropic => }/claude-haiku-4-5.toml | 0 .../{anthropic => }/claude-opus-4-1-20250805.toml | 0 .../{anthropic => }/claude-opus-4-20250514.toml | 0 .../{anthropic => }/claude-opus-4-5-20251101.toml | 0 .../{anthropic => }/claude-sonnet-4-20250514.toml | 0 .../claude-sonnet-4-5-20250929.toml | 0 .../models/{anthropic => }/claude-sonnet-4-5.toml | 0 .../llmgateway/models/{zai => }/cogview-4.toml | 0 .../llmgateway/models/{llmgateway => }/custom.toml | 0 .../models/{deepseek => }/deepseek-r1-0528.toml | 0 .../{deepseek => }/deepseek-r1t2-chimera-free.toml | 0 .../models/{deepseek => }/deepseek-v3.1.toml | 0 .../models/{deepseek => }/deepseek-v3.2.toml | 0 .../models/{deepseek => }/deepseek-v3.toml | 0 .../models/{google => }/gemini-2.0-flash-lite.toml | 0 .../models/{google => }/gemini-2.0-flash.toml | 0 .../gemini-2.5-flash-image-preview.toml | 0 .../{google => }/gemini-2.5-flash-image.toml | 0 .../gemini-2.5-flash-lite-preview-09-2025.toml | 0 .../models/{google => }/gemini-2.5-flash-lite.toml | 0 .../gemini-2.5-flash-preview-09-2025.toml | 0 .../models/{google => }/gemini-2.5-flash.toml | 0 .../models/{google => }/gemini-2.5-pro.toml | 0 .../{google => }/gemini-3-flash-preview.toml | 0 .../{google => }/gemini-3-pro-image-preview.toml | 0 .../models/{google => }/gemini-3-pro-preview.toml | 0 .../{google => }/gemma-2-27b-it-together.toml | 0 .../models/{google => 
}/gemma-3-12b-it.toml | 0 .../models/{google => }/gemma-3-1b-it.toml | 0 .../models/{google => }/gemma-3-27b.toml | 0 .../models/{google => }/gemma-3-4b-it.toml | 0 .../models/{google => }/gemma-3n-e2b-it.toml | 0 .../models/{google => }/gemma-3n-e4b-it.toml | 0 .../models/{zai => }/glm-4-32b-0414-128k.toml | 0 .../models/{zai => }/glm-4.5-air-free.toml | 0 .../llmgateway/models/{zai => }/glm-4.5-air.toml | 0 .../llmgateway/models/{zai => }/glm-4.5-airx.toml | 0 .../llmgateway/models/{zai => }/glm-4.5-flash.toml | 0 .../llmgateway/models/{zai => }/glm-4.5-x.toml | 0 providers/llmgateway/models/{zai => }/glm-4.5.toml | 0 .../llmgateway/models/{zai => }/glm-4.5v.toml | 0 providers/llmgateway/models/{zai => }/glm-4.6.toml | 0 .../models/{zai => }/glm-4.6v-flash.toml | 0 .../models/{zai => }/glm-4.6v-flashx.toml | 0 .../llmgateway/models/{zai => }/glm-4.6v.toml | 0 .../llmgateway/models/{zai => }/glm-4.7-flash.toml | 0 .../models/{zai => }/glm-4.7-flashx.toml | 0 providers/llmgateway/models/{zai => }/glm-4.7.toml | 0 .../llmgateway/models/{zai => }/glm-image.toml | 0 .../models/{openai => }/gpt-3.5-turbo.toml | 0 .../models/{openai => }/gpt-4-turbo.toml | 0 .../models/{openai => }/gpt-4.1-mini.toml | 0 .../models/{openai => }/gpt-4.1-nano.toml | 0 .../llmgateway/models/{openai => }/gpt-4.1.toml | 0 .../llmgateway/models/{openai => }/gpt-4.toml | 0 .../{openai => }/gpt-4o-mini-search-preview.toml | 0 .../models/{openai => }/gpt-4o-mini.toml | 0 .../models/{openai => }/gpt-4o-search-preview.toml | 0 .../llmgateway/models/{openai => }/gpt-4o.toml | 0 .../models/{openai => }/gpt-5-chat-latest.toml | 0 .../llmgateway/models/{openai => }/gpt-5-mini.toml | 0 .../llmgateway/models/{openai => }/gpt-5-nano.toml | 0 .../llmgateway/models/{openai => }/gpt-5-pro.toml | 0 .../models/{openai => }/gpt-5.1-codex-mini.toml | 0 .../models/{openai => }/gpt-5.1-codex.toml | 0 .../llmgateway/models/{openai => }/gpt-5.1.toml | 0 .../models/{openai => }/gpt-5.2-chat-latest.toml | 0 
.../models/{openai => }/gpt-5.2-pro.toml | 0 .../llmgateway/models/{openai => }/gpt-5.2.toml | 0 .../llmgateway/models/{openai => }/gpt-5.toml | 0 .../models/{openai => }/gpt-oss-120b.toml | 0 .../models/{openai => }/gpt-oss-20b-free.toml | 0 .../models/{openai => }/gpt-oss-20b.toml | 0 .../llmgateway/models/{xai => }/grok-3-mini.toml | 0 providers/llmgateway/models/{xai => }/grok-3.toml | 0 .../llmgateway/models/{xai => }/grok-4-0709.toml | 0 .../{xai => }/grok-4-1-fast-non-reasoning.toml | 0 .../models/{xai => }/grok-4-1-fast-reasoning.toml | 0 .../{xai => }/grok-4-fast-non-reasoning.toml | 0 .../models/{xai => }/grok-4-fast-reasoning.toml | 0 providers/llmgateway/models/{xai => }/grok-4.toml | 0 .../models/{xai => }/grok-code-fast-1.toml | 0 .../models/{moonshot => }/kimi-k2-0905-free.toml | 0 .../{moonshot => }/kimi-k2-thinking-turbo.toml | 0 .../models/{moonshot => }/kimi-k2-thinking.toml | 0 .../llmgateway/models/{moonshot => }/kimi-k2.toml | 0 .../models/{meta => }/llama-3.1-70b-instruct.toml | 0 .../models/{meta => }/llama-3.1-8b-instruct.toml | 0 .../{meta => }/llama-3.1-nemotron-ultra-253b.toml | 0 .../models/{meta => }/llama-3.2-11b-instruct.toml | 0 .../{meta => }/llama-3.3-70b-instruct-free.toml | 0 .../models/{meta => }/llama-3.3-70b-instruct.toml | 0 .../{meta => }/llama-4-maverick-17b-instruct.toml | 0 .../models/{meta => }/llama-4-maverick-free.toml | 0 .../{meta => }/llama-4-scout-17b-instruct.toml | 0 .../models/{meta => }/llama-4-scout-free.toml | 0 .../models/{meta => }/llama-4-scout.toml | 0 .../models/{meta => }/llama-guard-4-12b.toml | 0 .../models/{minimax => }/minimax-m2.1.toml | 0 .../models/{mistral => }/mistral-large-latest.toml | 0 .../mixtral-8x7b-instruct-together.toml | 0 .../models/{nvidia => }/nemotron-nano-9b-v2.toml | 0 .../llmgateway/models/{openai => }/o1-mini.toml | 0 providers/llmgateway/models/{openai => }/o1.toml | 0 .../llmgateway/models/{openai => }/o3-mini.toml | 0 providers/llmgateway/models/{openai => }/o3.toml | 0 
.../models/{mistral => }/pixtral-large-latest.toml | 0 .../models/{alibaba => }/qwen-flash.toml | 0 .../{alibaba => }/qwen-image-max-2025-12-30.toml | 0 .../models/{alibaba => }/qwen-image-max.toml | 0 .../models/{alibaba => }/qwen-image-plus.toml | 0 .../models/{alibaba => }/qwen-image.toml | 0 .../models/{alibaba => }/qwen-max-latest.toml | 0 .../llmgateway/models/{alibaba => }/qwen-max.toml | 0 .../models/{alibaba => }/qwen-omni-turbo.toml | 0 .../models/{alibaba => }/qwen-plus-latest.toml | 0 .../llmgateway/models/{alibaba => }/qwen-plus.toml | 0 .../models/{alibaba => }/qwen-turbo.toml | 0 .../models/{alibaba => }/qwen-vl-max.toml | 0 .../models/{alibaba => }/qwen-vl-plus.toml | 0 .../{alibaba => }/qwen2-5-vl-72b-instruct.toml | 0 .../models/{alibaba => }/qwen25-coder-7b.toml | 0 .../qwen3-235b-a22b-instruct-2507.toml | 0 .../qwen3-235b-a22b-thinking-2507.toml | 0 .../{alibaba => }/qwen3-30b-a3b-instruct-2507.toml | 0 .../{alibaba => }/qwen3-30b-a3b-thinking-2507.toml | 0 .../llmgateway/models/{alibaba => }/qwen3-32b.toml | 0 .../qwen3-coder-30b-a3b-instruct.toml | 0 .../qwen3-coder-480b-a35b-instruct.toml | 0 .../models/{alibaba => }/qwen3-coder-plus.toml | 0 .../models/{alibaba => }/qwen3-coder.toml | 0 .../llmgateway/models/{alibaba => }/qwen3-max.toml | 0 .../{alibaba => }/qwen3-next-80b-a3b-instruct.toml | 0 .../{alibaba => }/qwen3-next-80b-a3b-thinking.toml | 0 .../models/{bytedance => }/seed-1-6-250615.toml | 0 .../models/{bytedance => }/seed-1-6-250915.toml | 0 .../{bytedance => }/seed-1-6-flash-250715.toml | 0 .../models/{bytedance => }/seed-1-8-251228.toml | 0 .../models/{bytedance => }/seedream-4-0.toml | 0 .../models/{bytedance => }/seedream-4-5.toml | 0 .../models/{perplexity => }/sonar-pro.toml | 0 .../{perplexity => }/sonar-reasoning-pro.toml | 0 .../llmgateway/models/{perplexity => }/sonar.toml | 0 providers/llmgateway/scripts/generate.ts | 2 +- 155 files changed, 3 insertions(+), 13 deletions(-) rename providers/llmgateway/models/{llmgateway 
=> }/auto.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-3-5-haiku-20241022.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-3-5-haiku.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-3-5-sonnet-20240620.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-3-5-sonnet.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-3-7-sonnet-20250219.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-3-7-sonnet.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-3-haiku.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-3-opus.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-haiku-4-5-20251001.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-haiku-4-5.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-opus-4-1-20250805.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-opus-4-20250514.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-opus-4-5-20251101.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-sonnet-4-20250514.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-sonnet-4-5-20250929.toml (100%) rename providers/llmgateway/models/{anthropic => }/claude-sonnet-4-5.toml (100%) rename providers/llmgateway/models/{zai => }/cogview-4.toml (100%) rename providers/llmgateway/models/{llmgateway => }/custom.toml (100%) rename providers/llmgateway/models/{deepseek => }/deepseek-r1-0528.toml (100%) rename providers/llmgateway/models/{deepseek => }/deepseek-r1t2-chimera-free.toml (100%) rename providers/llmgateway/models/{deepseek => }/deepseek-v3.1.toml (100%) rename providers/llmgateway/models/{deepseek => }/deepseek-v3.2.toml (100%) rename providers/llmgateway/models/{deepseek => }/deepseek-v3.toml (100%) rename providers/llmgateway/models/{google => }/gemini-2.0-flash-lite.toml (100%) rename 
providers/llmgateway/models/{google => }/gemini-2.0-flash.toml (100%) rename providers/llmgateway/models/{google => }/gemini-2.5-flash-image-preview.toml (100%) rename providers/llmgateway/models/{google => }/gemini-2.5-flash-image.toml (100%) rename providers/llmgateway/models/{google => }/gemini-2.5-flash-lite-preview-09-2025.toml (100%) rename providers/llmgateway/models/{google => }/gemini-2.5-flash-lite.toml (100%) rename providers/llmgateway/models/{google => }/gemini-2.5-flash-preview-09-2025.toml (100%) rename providers/llmgateway/models/{google => }/gemini-2.5-flash.toml (100%) rename providers/llmgateway/models/{google => }/gemini-2.5-pro.toml (100%) rename providers/llmgateway/models/{google => }/gemini-3-flash-preview.toml (100%) rename providers/llmgateway/models/{google => }/gemini-3-pro-image-preview.toml (100%) rename providers/llmgateway/models/{google => }/gemini-3-pro-preview.toml (100%) rename providers/llmgateway/models/{google => }/gemma-2-27b-it-together.toml (100%) rename providers/llmgateway/models/{google => }/gemma-3-12b-it.toml (100%) rename providers/llmgateway/models/{google => }/gemma-3-1b-it.toml (100%) rename providers/llmgateway/models/{google => }/gemma-3-27b.toml (100%) rename providers/llmgateway/models/{google => }/gemma-3-4b-it.toml (100%) rename providers/llmgateway/models/{google => }/gemma-3n-e2b-it.toml (100%) rename providers/llmgateway/models/{google => }/gemma-3n-e4b-it.toml (100%) rename providers/llmgateway/models/{zai => }/glm-4-32b-0414-128k.toml (100%) rename providers/llmgateway/models/{zai => }/glm-4.5-air-free.toml (100%) rename providers/llmgateway/models/{zai => }/glm-4.5-air.toml (100%) rename providers/llmgateway/models/{zai => }/glm-4.5-airx.toml (100%) rename providers/llmgateway/models/{zai => }/glm-4.5-flash.toml (100%) rename providers/llmgateway/models/{zai => }/glm-4.5-x.toml (100%) rename providers/llmgateway/models/{zai => }/glm-4.5.toml (100%) rename providers/llmgateway/models/{zai => 
}/glm-4.5v.toml (100%) rename providers/llmgateway/models/{zai => }/glm-4.6.toml (100%) rename providers/llmgateway/models/{zai => }/glm-4.6v-flash.toml (100%) rename providers/llmgateway/models/{zai => }/glm-4.6v-flashx.toml (100%) rename providers/llmgateway/models/{zai => }/glm-4.6v.toml (100%) rename providers/llmgateway/models/{zai => }/glm-4.7-flash.toml (100%) rename providers/llmgateway/models/{zai => }/glm-4.7-flashx.toml (100%) rename providers/llmgateway/models/{zai => }/glm-4.7.toml (100%) rename providers/llmgateway/models/{zai => }/glm-image.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-3.5-turbo.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-4-turbo.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-4.1-mini.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-4.1-nano.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-4.1.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-4.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-4o-mini-search-preview.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-4o-mini.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-4o-search-preview.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-4o.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-5-chat-latest.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-5-mini.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-5-nano.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-5-pro.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-5.1-codex-mini.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-5.1-codex.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-5.1.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-5.2-chat-latest.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-5.2-pro.toml (100%) rename 
providers/llmgateway/models/{openai => }/gpt-5.2.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-5.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-oss-120b.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-oss-20b-free.toml (100%) rename providers/llmgateway/models/{openai => }/gpt-oss-20b.toml (100%) rename providers/llmgateway/models/{xai => }/grok-3-mini.toml (100%) rename providers/llmgateway/models/{xai => }/grok-3.toml (100%) rename providers/llmgateway/models/{xai => }/grok-4-0709.toml (100%) rename providers/llmgateway/models/{xai => }/grok-4-1-fast-non-reasoning.toml (100%) rename providers/llmgateway/models/{xai => }/grok-4-1-fast-reasoning.toml (100%) rename providers/llmgateway/models/{xai => }/grok-4-fast-non-reasoning.toml (100%) rename providers/llmgateway/models/{xai => }/grok-4-fast-reasoning.toml (100%) rename providers/llmgateway/models/{xai => }/grok-4.toml (100%) rename providers/llmgateway/models/{xai => }/grok-code-fast-1.toml (100%) rename providers/llmgateway/models/{moonshot => }/kimi-k2-0905-free.toml (100%) rename providers/llmgateway/models/{moonshot => }/kimi-k2-thinking-turbo.toml (100%) rename providers/llmgateway/models/{moonshot => }/kimi-k2-thinking.toml (100%) rename providers/llmgateway/models/{moonshot => }/kimi-k2.toml (100%) rename providers/llmgateway/models/{meta => }/llama-3.1-70b-instruct.toml (100%) rename providers/llmgateway/models/{meta => }/llama-3.1-8b-instruct.toml (100%) rename providers/llmgateway/models/{meta => }/llama-3.1-nemotron-ultra-253b.toml (100%) rename providers/llmgateway/models/{meta => }/llama-3.2-11b-instruct.toml (100%) rename providers/llmgateway/models/{meta => }/llama-3.3-70b-instruct-free.toml (100%) rename providers/llmgateway/models/{meta => }/llama-3.3-70b-instruct.toml (100%) rename providers/llmgateway/models/{meta => }/llama-4-maverick-17b-instruct.toml (100%) rename providers/llmgateway/models/{meta => }/llama-4-maverick-free.toml (100%) 
rename providers/llmgateway/models/{meta => }/llama-4-scout-17b-instruct.toml (100%) rename providers/llmgateway/models/{meta => }/llama-4-scout-free.toml (100%) rename providers/llmgateway/models/{meta => }/llama-4-scout.toml (100%) rename providers/llmgateway/models/{meta => }/llama-guard-4-12b.toml (100%) rename providers/llmgateway/models/{minimax => }/minimax-m2.1.toml (100%) rename providers/llmgateway/models/{mistral => }/mistral-large-latest.toml (100%) rename providers/llmgateway/models/{mistral => }/mixtral-8x7b-instruct-together.toml (100%) rename providers/llmgateway/models/{nvidia => }/nemotron-nano-9b-v2.toml (100%) rename providers/llmgateway/models/{openai => }/o1-mini.toml (100%) rename providers/llmgateway/models/{openai => }/o1.toml (100%) rename providers/llmgateway/models/{openai => }/o3-mini.toml (100%) rename providers/llmgateway/models/{openai => }/o3.toml (100%) rename providers/llmgateway/models/{mistral => }/pixtral-large-latest.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen-flash.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen-image-max-2025-12-30.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen-image-max.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen-image-plus.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen-image.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen-max-latest.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen-max.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen-omni-turbo.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen-plus-latest.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen-plus.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen-turbo.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen-vl-max.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen-vl-plus.toml (100%) rename 
providers/llmgateway/models/{alibaba => }/qwen2-5-vl-72b-instruct.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen25-coder-7b.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen3-235b-a22b-instruct-2507.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen3-235b-a22b-thinking-2507.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen3-30b-a3b-instruct-2507.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen3-30b-a3b-thinking-2507.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen3-32b.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen3-coder-30b-a3b-instruct.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen3-coder-480b-a35b-instruct.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen3-coder-plus.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen3-coder.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen3-max.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen3-next-80b-a3b-instruct.toml (100%) rename providers/llmgateway/models/{alibaba => }/qwen3-next-80b-a3b-thinking.toml (100%) rename providers/llmgateway/models/{bytedance => }/seed-1-6-250615.toml (100%) rename providers/llmgateway/models/{bytedance => }/seed-1-6-250915.toml (100%) rename providers/llmgateway/models/{bytedance => }/seed-1-6-flash-250715.toml (100%) rename providers/llmgateway/models/{bytedance => }/seed-1-8-251228.toml (100%) rename providers/llmgateway/models/{bytedance => }/seedream-4-0.toml (100%) rename providers/llmgateway/models/{bytedance => }/seedream-4-5.toml (100%) rename providers/llmgateway/models/{perplexity => }/sonar-pro.toml (100%) rename providers/llmgateway/models/{perplexity => }/sonar-reasoning-pro.toml (100%) rename providers/llmgateway/models/{perplexity => }/sonar.toml (100%) diff --git a/providers/llmgateway/README.md b/providers/llmgateway/README.md index 8292fff56..ff4c0448f 100644 --- 
a/providers/llmgateway/README.md +++ b/providers/llmgateway/README.md @@ -4,20 +4,10 @@ This provider enables access to 150+ AI models through [LLM Gateway](https://llm ## Directory Structure -- **models/**: TOML configuration files organized by upstream provider - - **anthropic/**: Claude models - - **openai/**: GPT and o-series models - - **google/**: Gemini and Gemma models - - **meta/**: Llama models - - **xai/**: Grok models - - **deepseek/**: DeepSeek models - - **alibaba/**: Qwen models - - **mistral/**: Mistral and Mixtral models - - **zai/**: GLM models - - **llmgateway/**: LLM Gateway native models (auto-routing) - - And more... +- **models/**: TOML configuration files for all supported models - **scripts/**: Scripts for generating model configurations - **provider.toml**: Provider configuration +- **logo.svg**: Provider logo ## How It Works diff --git a/providers/llmgateway/models/llmgateway/auto.toml b/providers/llmgateway/models/auto.toml similarity index 100% rename from providers/llmgateway/models/llmgateway/auto.toml rename to providers/llmgateway/models/auto.toml diff --git a/providers/llmgateway/models/anthropic/claude-3-5-haiku-20241022.toml b/providers/llmgateway/models/claude-3-5-haiku-20241022.toml similarity index 100% rename from providers/llmgateway/models/anthropic/claude-3-5-haiku-20241022.toml rename to providers/llmgateway/models/claude-3-5-haiku-20241022.toml diff --git a/providers/llmgateway/models/anthropic/claude-3-5-haiku.toml b/providers/llmgateway/models/claude-3-5-haiku.toml similarity index 100% rename from providers/llmgateway/models/anthropic/claude-3-5-haiku.toml rename to providers/llmgateway/models/claude-3-5-haiku.toml diff --git a/providers/llmgateway/models/anthropic/claude-3-5-sonnet-20240620.toml b/providers/llmgateway/models/claude-3-5-sonnet-20240620.toml similarity index 100% rename from providers/llmgateway/models/anthropic/claude-3-5-sonnet-20240620.toml rename to 
providers/llmgateway/models/claude-3-5-sonnet-20240620.toml diff --git a/providers/llmgateway/models/anthropic/claude-3-5-sonnet.toml b/providers/llmgateway/models/claude-3-5-sonnet.toml similarity index 100% rename from providers/llmgateway/models/anthropic/claude-3-5-sonnet.toml rename to providers/llmgateway/models/claude-3-5-sonnet.toml diff --git a/providers/llmgateway/models/anthropic/claude-3-7-sonnet-20250219.toml b/providers/llmgateway/models/claude-3-7-sonnet-20250219.toml similarity index 100% rename from providers/llmgateway/models/anthropic/claude-3-7-sonnet-20250219.toml rename to providers/llmgateway/models/claude-3-7-sonnet-20250219.toml diff --git a/providers/llmgateway/models/anthropic/claude-3-7-sonnet.toml b/providers/llmgateway/models/claude-3-7-sonnet.toml similarity index 100% rename from providers/llmgateway/models/anthropic/claude-3-7-sonnet.toml rename to providers/llmgateway/models/claude-3-7-sonnet.toml diff --git a/providers/llmgateway/models/anthropic/claude-3-haiku.toml b/providers/llmgateway/models/claude-3-haiku.toml similarity index 100% rename from providers/llmgateway/models/anthropic/claude-3-haiku.toml rename to providers/llmgateway/models/claude-3-haiku.toml diff --git a/providers/llmgateway/models/anthropic/claude-3-opus.toml b/providers/llmgateway/models/claude-3-opus.toml similarity index 100% rename from providers/llmgateway/models/anthropic/claude-3-opus.toml rename to providers/llmgateway/models/claude-3-opus.toml diff --git a/providers/llmgateway/models/anthropic/claude-haiku-4-5-20251001.toml b/providers/llmgateway/models/claude-haiku-4-5-20251001.toml similarity index 100% rename from providers/llmgateway/models/anthropic/claude-haiku-4-5-20251001.toml rename to providers/llmgateway/models/claude-haiku-4-5-20251001.toml diff --git a/providers/llmgateway/models/anthropic/claude-haiku-4-5.toml b/providers/llmgateway/models/claude-haiku-4-5.toml similarity index 100% rename from 
providers/llmgateway/models/anthropic/claude-haiku-4-5.toml rename to providers/llmgateway/models/claude-haiku-4-5.toml diff --git a/providers/llmgateway/models/anthropic/claude-opus-4-1-20250805.toml b/providers/llmgateway/models/claude-opus-4-1-20250805.toml similarity index 100% rename from providers/llmgateway/models/anthropic/claude-opus-4-1-20250805.toml rename to providers/llmgateway/models/claude-opus-4-1-20250805.toml diff --git a/providers/llmgateway/models/anthropic/claude-opus-4-20250514.toml b/providers/llmgateway/models/claude-opus-4-20250514.toml similarity index 100% rename from providers/llmgateway/models/anthropic/claude-opus-4-20250514.toml rename to providers/llmgateway/models/claude-opus-4-20250514.toml diff --git a/providers/llmgateway/models/anthropic/claude-opus-4-5-20251101.toml b/providers/llmgateway/models/claude-opus-4-5-20251101.toml similarity index 100% rename from providers/llmgateway/models/anthropic/claude-opus-4-5-20251101.toml rename to providers/llmgateway/models/claude-opus-4-5-20251101.toml diff --git a/providers/llmgateway/models/anthropic/claude-sonnet-4-20250514.toml b/providers/llmgateway/models/claude-sonnet-4-20250514.toml similarity index 100% rename from providers/llmgateway/models/anthropic/claude-sonnet-4-20250514.toml rename to providers/llmgateway/models/claude-sonnet-4-20250514.toml diff --git a/providers/llmgateway/models/anthropic/claude-sonnet-4-5-20250929.toml b/providers/llmgateway/models/claude-sonnet-4-5-20250929.toml similarity index 100% rename from providers/llmgateway/models/anthropic/claude-sonnet-4-5-20250929.toml rename to providers/llmgateway/models/claude-sonnet-4-5-20250929.toml diff --git a/providers/llmgateway/models/anthropic/claude-sonnet-4-5.toml b/providers/llmgateway/models/claude-sonnet-4-5.toml similarity index 100% rename from providers/llmgateway/models/anthropic/claude-sonnet-4-5.toml rename to providers/llmgateway/models/claude-sonnet-4-5.toml diff --git 
a/providers/llmgateway/models/zai/cogview-4.toml b/providers/llmgateway/models/cogview-4.toml similarity index 100% rename from providers/llmgateway/models/zai/cogview-4.toml rename to providers/llmgateway/models/cogview-4.toml diff --git a/providers/llmgateway/models/llmgateway/custom.toml b/providers/llmgateway/models/custom.toml similarity index 100% rename from providers/llmgateway/models/llmgateway/custom.toml rename to providers/llmgateway/models/custom.toml diff --git a/providers/llmgateway/models/deepseek/deepseek-r1-0528.toml b/providers/llmgateway/models/deepseek-r1-0528.toml similarity index 100% rename from providers/llmgateway/models/deepseek/deepseek-r1-0528.toml rename to providers/llmgateway/models/deepseek-r1-0528.toml diff --git a/providers/llmgateway/models/deepseek/deepseek-r1t2-chimera-free.toml b/providers/llmgateway/models/deepseek-r1t2-chimera-free.toml similarity index 100% rename from providers/llmgateway/models/deepseek/deepseek-r1t2-chimera-free.toml rename to providers/llmgateway/models/deepseek-r1t2-chimera-free.toml diff --git a/providers/llmgateway/models/deepseek/deepseek-v3.1.toml b/providers/llmgateway/models/deepseek-v3.1.toml similarity index 100% rename from providers/llmgateway/models/deepseek/deepseek-v3.1.toml rename to providers/llmgateway/models/deepseek-v3.1.toml diff --git a/providers/llmgateway/models/deepseek/deepseek-v3.2.toml b/providers/llmgateway/models/deepseek-v3.2.toml similarity index 100% rename from providers/llmgateway/models/deepseek/deepseek-v3.2.toml rename to providers/llmgateway/models/deepseek-v3.2.toml diff --git a/providers/llmgateway/models/deepseek/deepseek-v3.toml b/providers/llmgateway/models/deepseek-v3.toml similarity index 100% rename from providers/llmgateway/models/deepseek/deepseek-v3.toml rename to providers/llmgateway/models/deepseek-v3.toml diff --git a/providers/llmgateway/models/google/gemini-2.0-flash-lite.toml b/providers/llmgateway/models/gemini-2.0-flash-lite.toml similarity index 
100% rename from providers/llmgateway/models/google/gemini-2.0-flash-lite.toml rename to providers/llmgateway/models/gemini-2.0-flash-lite.toml diff --git a/providers/llmgateway/models/google/gemini-2.0-flash.toml b/providers/llmgateway/models/gemini-2.0-flash.toml similarity index 100% rename from providers/llmgateway/models/google/gemini-2.0-flash.toml rename to providers/llmgateway/models/gemini-2.0-flash.toml diff --git a/providers/llmgateway/models/google/gemini-2.5-flash-image-preview.toml b/providers/llmgateway/models/gemini-2.5-flash-image-preview.toml similarity index 100% rename from providers/llmgateway/models/google/gemini-2.5-flash-image-preview.toml rename to providers/llmgateway/models/gemini-2.5-flash-image-preview.toml diff --git a/providers/llmgateway/models/google/gemini-2.5-flash-image.toml b/providers/llmgateway/models/gemini-2.5-flash-image.toml similarity index 100% rename from providers/llmgateway/models/google/gemini-2.5-flash-image.toml rename to providers/llmgateway/models/gemini-2.5-flash-image.toml diff --git a/providers/llmgateway/models/google/gemini-2.5-flash-lite-preview-09-2025.toml b/providers/llmgateway/models/gemini-2.5-flash-lite-preview-09-2025.toml similarity index 100% rename from providers/llmgateway/models/google/gemini-2.5-flash-lite-preview-09-2025.toml rename to providers/llmgateway/models/gemini-2.5-flash-lite-preview-09-2025.toml diff --git a/providers/llmgateway/models/google/gemini-2.5-flash-lite.toml b/providers/llmgateway/models/gemini-2.5-flash-lite.toml similarity index 100% rename from providers/llmgateway/models/google/gemini-2.5-flash-lite.toml rename to providers/llmgateway/models/gemini-2.5-flash-lite.toml diff --git a/providers/llmgateway/models/google/gemini-2.5-flash-preview-09-2025.toml b/providers/llmgateway/models/gemini-2.5-flash-preview-09-2025.toml similarity index 100% rename from providers/llmgateway/models/google/gemini-2.5-flash-preview-09-2025.toml rename to 
providers/llmgateway/models/gemini-2.5-flash-preview-09-2025.toml diff --git a/providers/llmgateway/models/google/gemini-2.5-flash.toml b/providers/llmgateway/models/gemini-2.5-flash.toml similarity index 100% rename from providers/llmgateway/models/google/gemini-2.5-flash.toml rename to providers/llmgateway/models/gemini-2.5-flash.toml diff --git a/providers/llmgateway/models/google/gemini-2.5-pro.toml b/providers/llmgateway/models/gemini-2.5-pro.toml similarity index 100% rename from providers/llmgateway/models/google/gemini-2.5-pro.toml rename to providers/llmgateway/models/gemini-2.5-pro.toml diff --git a/providers/llmgateway/models/google/gemini-3-flash-preview.toml b/providers/llmgateway/models/gemini-3-flash-preview.toml similarity index 100% rename from providers/llmgateway/models/google/gemini-3-flash-preview.toml rename to providers/llmgateway/models/gemini-3-flash-preview.toml diff --git a/providers/llmgateway/models/google/gemini-3-pro-image-preview.toml b/providers/llmgateway/models/gemini-3-pro-image-preview.toml similarity index 100% rename from providers/llmgateway/models/google/gemini-3-pro-image-preview.toml rename to providers/llmgateway/models/gemini-3-pro-image-preview.toml diff --git a/providers/llmgateway/models/google/gemini-3-pro-preview.toml b/providers/llmgateway/models/gemini-3-pro-preview.toml similarity index 100% rename from providers/llmgateway/models/google/gemini-3-pro-preview.toml rename to providers/llmgateway/models/gemini-3-pro-preview.toml diff --git a/providers/llmgateway/models/google/gemma-2-27b-it-together.toml b/providers/llmgateway/models/gemma-2-27b-it-together.toml similarity index 100% rename from providers/llmgateway/models/google/gemma-2-27b-it-together.toml rename to providers/llmgateway/models/gemma-2-27b-it-together.toml diff --git a/providers/llmgateway/models/google/gemma-3-12b-it.toml b/providers/llmgateway/models/gemma-3-12b-it.toml similarity index 100% rename from 
providers/llmgateway/models/google/gemma-3-12b-it.toml rename to providers/llmgateway/models/gemma-3-12b-it.toml diff --git a/providers/llmgateway/models/google/gemma-3-1b-it.toml b/providers/llmgateway/models/gemma-3-1b-it.toml similarity index 100% rename from providers/llmgateway/models/google/gemma-3-1b-it.toml rename to providers/llmgateway/models/gemma-3-1b-it.toml diff --git a/providers/llmgateway/models/google/gemma-3-27b.toml b/providers/llmgateway/models/gemma-3-27b.toml similarity index 100% rename from providers/llmgateway/models/google/gemma-3-27b.toml rename to providers/llmgateway/models/gemma-3-27b.toml diff --git a/providers/llmgateway/models/google/gemma-3-4b-it.toml b/providers/llmgateway/models/gemma-3-4b-it.toml similarity index 100% rename from providers/llmgateway/models/google/gemma-3-4b-it.toml rename to providers/llmgateway/models/gemma-3-4b-it.toml diff --git a/providers/llmgateway/models/google/gemma-3n-e2b-it.toml b/providers/llmgateway/models/gemma-3n-e2b-it.toml similarity index 100% rename from providers/llmgateway/models/google/gemma-3n-e2b-it.toml rename to providers/llmgateway/models/gemma-3n-e2b-it.toml diff --git a/providers/llmgateway/models/google/gemma-3n-e4b-it.toml b/providers/llmgateway/models/gemma-3n-e4b-it.toml similarity index 100% rename from providers/llmgateway/models/google/gemma-3n-e4b-it.toml rename to providers/llmgateway/models/gemma-3n-e4b-it.toml diff --git a/providers/llmgateway/models/zai/glm-4-32b-0414-128k.toml b/providers/llmgateway/models/glm-4-32b-0414-128k.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-4-32b-0414-128k.toml rename to providers/llmgateway/models/glm-4-32b-0414-128k.toml diff --git a/providers/llmgateway/models/zai/glm-4.5-air-free.toml b/providers/llmgateway/models/glm-4.5-air-free.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-4.5-air-free.toml rename to providers/llmgateway/models/glm-4.5-air-free.toml diff --git 
a/providers/llmgateway/models/zai/glm-4.5-air.toml b/providers/llmgateway/models/glm-4.5-air.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-4.5-air.toml rename to providers/llmgateway/models/glm-4.5-air.toml diff --git a/providers/llmgateway/models/zai/glm-4.5-airx.toml b/providers/llmgateway/models/glm-4.5-airx.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-4.5-airx.toml rename to providers/llmgateway/models/glm-4.5-airx.toml diff --git a/providers/llmgateway/models/zai/glm-4.5-flash.toml b/providers/llmgateway/models/glm-4.5-flash.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-4.5-flash.toml rename to providers/llmgateway/models/glm-4.5-flash.toml diff --git a/providers/llmgateway/models/zai/glm-4.5-x.toml b/providers/llmgateway/models/glm-4.5-x.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-4.5-x.toml rename to providers/llmgateway/models/glm-4.5-x.toml diff --git a/providers/llmgateway/models/zai/glm-4.5.toml b/providers/llmgateway/models/glm-4.5.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-4.5.toml rename to providers/llmgateway/models/glm-4.5.toml diff --git a/providers/llmgateway/models/zai/glm-4.5v.toml b/providers/llmgateway/models/glm-4.5v.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-4.5v.toml rename to providers/llmgateway/models/glm-4.5v.toml diff --git a/providers/llmgateway/models/zai/glm-4.6.toml b/providers/llmgateway/models/glm-4.6.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-4.6.toml rename to providers/llmgateway/models/glm-4.6.toml diff --git a/providers/llmgateway/models/zai/glm-4.6v-flash.toml b/providers/llmgateway/models/glm-4.6v-flash.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-4.6v-flash.toml rename to providers/llmgateway/models/glm-4.6v-flash.toml diff --git 
a/providers/llmgateway/models/zai/glm-4.6v-flashx.toml b/providers/llmgateway/models/glm-4.6v-flashx.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-4.6v-flashx.toml rename to providers/llmgateway/models/glm-4.6v-flashx.toml diff --git a/providers/llmgateway/models/zai/glm-4.6v.toml b/providers/llmgateway/models/glm-4.6v.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-4.6v.toml rename to providers/llmgateway/models/glm-4.6v.toml diff --git a/providers/llmgateway/models/zai/glm-4.7-flash.toml b/providers/llmgateway/models/glm-4.7-flash.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-4.7-flash.toml rename to providers/llmgateway/models/glm-4.7-flash.toml diff --git a/providers/llmgateway/models/zai/glm-4.7-flashx.toml b/providers/llmgateway/models/glm-4.7-flashx.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-4.7-flashx.toml rename to providers/llmgateway/models/glm-4.7-flashx.toml diff --git a/providers/llmgateway/models/zai/glm-4.7.toml b/providers/llmgateway/models/glm-4.7.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-4.7.toml rename to providers/llmgateway/models/glm-4.7.toml diff --git a/providers/llmgateway/models/zai/glm-image.toml b/providers/llmgateway/models/glm-image.toml similarity index 100% rename from providers/llmgateway/models/zai/glm-image.toml rename to providers/llmgateway/models/glm-image.toml diff --git a/providers/llmgateway/models/openai/gpt-3.5-turbo.toml b/providers/llmgateway/models/gpt-3.5-turbo.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-3.5-turbo.toml rename to providers/llmgateway/models/gpt-3.5-turbo.toml diff --git a/providers/llmgateway/models/openai/gpt-4-turbo.toml b/providers/llmgateway/models/gpt-4-turbo.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-4-turbo.toml rename to providers/llmgateway/models/gpt-4-turbo.toml diff --git 
a/providers/llmgateway/models/openai/gpt-4.1-mini.toml b/providers/llmgateway/models/gpt-4.1-mini.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-4.1-mini.toml rename to providers/llmgateway/models/gpt-4.1-mini.toml diff --git a/providers/llmgateway/models/openai/gpt-4.1-nano.toml b/providers/llmgateway/models/gpt-4.1-nano.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-4.1-nano.toml rename to providers/llmgateway/models/gpt-4.1-nano.toml diff --git a/providers/llmgateway/models/openai/gpt-4.1.toml b/providers/llmgateway/models/gpt-4.1.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-4.1.toml rename to providers/llmgateway/models/gpt-4.1.toml diff --git a/providers/llmgateway/models/openai/gpt-4.toml b/providers/llmgateway/models/gpt-4.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-4.toml rename to providers/llmgateway/models/gpt-4.toml diff --git a/providers/llmgateway/models/openai/gpt-4o-mini-search-preview.toml b/providers/llmgateway/models/gpt-4o-mini-search-preview.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-4o-mini-search-preview.toml rename to providers/llmgateway/models/gpt-4o-mini-search-preview.toml diff --git a/providers/llmgateway/models/openai/gpt-4o-mini.toml b/providers/llmgateway/models/gpt-4o-mini.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-4o-mini.toml rename to providers/llmgateway/models/gpt-4o-mini.toml diff --git a/providers/llmgateway/models/openai/gpt-4o-search-preview.toml b/providers/llmgateway/models/gpt-4o-search-preview.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-4o-search-preview.toml rename to providers/llmgateway/models/gpt-4o-search-preview.toml diff --git a/providers/llmgateway/models/openai/gpt-4o.toml b/providers/llmgateway/models/gpt-4o.toml similarity index 100% rename from 
providers/llmgateway/models/openai/gpt-4o.toml rename to providers/llmgateway/models/gpt-4o.toml diff --git a/providers/llmgateway/models/openai/gpt-5-chat-latest.toml b/providers/llmgateway/models/gpt-5-chat-latest.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-5-chat-latest.toml rename to providers/llmgateway/models/gpt-5-chat-latest.toml diff --git a/providers/llmgateway/models/openai/gpt-5-mini.toml b/providers/llmgateway/models/gpt-5-mini.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-5-mini.toml rename to providers/llmgateway/models/gpt-5-mini.toml diff --git a/providers/llmgateway/models/openai/gpt-5-nano.toml b/providers/llmgateway/models/gpt-5-nano.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-5-nano.toml rename to providers/llmgateway/models/gpt-5-nano.toml diff --git a/providers/llmgateway/models/openai/gpt-5-pro.toml b/providers/llmgateway/models/gpt-5-pro.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-5-pro.toml rename to providers/llmgateway/models/gpt-5-pro.toml diff --git a/providers/llmgateway/models/openai/gpt-5.1-codex-mini.toml b/providers/llmgateway/models/gpt-5.1-codex-mini.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-5.1-codex-mini.toml rename to providers/llmgateway/models/gpt-5.1-codex-mini.toml diff --git a/providers/llmgateway/models/openai/gpt-5.1-codex.toml b/providers/llmgateway/models/gpt-5.1-codex.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-5.1-codex.toml rename to providers/llmgateway/models/gpt-5.1-codex.toml diff --git a/providers/llmgateway/models/openai/gpt-5.1.toml b/providers/llmgateway/models/gpt-5.1.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-5.1.toml rename to providers/llmgateway/models/gpt-5.1.toml diff --git a/providers/llmgateway/models/openai/gpt-5.2-chat-latest.toml 
b/providers/llmgateway/models/gpt-5.2-chat-latest.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-5.2-chat-latest.toml rename to providers/llmgateway/models/gpt-5.2-chat-latest.toml diff --git a/providers/llmgateway/models/openai/gpt-5.2-pro.toml b/providers/llmgateway/models/gpt-5.2-pro.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-5.2-pro.toml rename to providers/llmgateway/models/gpt-5.2-pro.toml diff --git a/providers/llmgateway/models/openai/gpt-5.2.toml b/providers/llmgateway/models/gpt-5.2.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-5.2.toml rename to providers/llmgateway/models/gpt-5.2.toml diff --git a/providers/llmgateway/models/openai/gpt-5.toml b/providers/llmgateway/models/gpt-5.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-5.toml rename to providers/llmgateway/models/gpt-5.toml diff --git a/providers/llmgateway/models/openai/gpt-oss-120b.toml b/providers/llmgateway/models/gpt-oss-120b.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-oss-120b.toml rename to providers/llmgateway/models/gpt-oss-120b.toml diff --git a/providers/llmgateway/models/openai/gpt-oss-20b-free.toml b/providers/llmgateway/models/gpt-oss-20b-free.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-oss-20b-free.toml rename to providers/llmgateway/models/gpt-oss-20b-free.toml diff --git a/providers/llmgateway/models/openai/gpt-oss-20b.toml b/providers/llmgateway/models/gpt-oss-20b.toml similarity index 100% rename from providers/llmgateway/models/openai/gpt-oss-20b.toml rename to providers/llmgateway/models/gpt-oss-20b.toml diff --git a/providers/llmgateway/models/xai/grok-3-mini.toml b/providers/llmgateway/models/grok-3-mini.toml similarity index 100% rename from providers/llmgateway/models/xai/grok-3-mini.toml rename to providers/llmgateway/models/grok-3-mini.toml diff --git 
a/providers/llmgateway/models/xai/grok-3.toml b/providers/llmgateway/models/grok-3.toml similarity index 100% rename from providers/llmgateway/models/xai/grok-3.toml rename to providers/llmgateway/models/grok-3.toml diff --git a/providers/llmgateway/models/xai/grok-4-0709.toml b/providers/llmgateway/models/grok-4-0709.toml similarity index 100% rename from providers/llmgateway/models/xai/grok-4-0709.toml rename to providers/llmgateway/models/grok-4-0709.toml diff --git a/providers/llmgateway/models/xai/grok-4-1-fast-non-reasoning.toml b/providers/llmgateway/models/grok-4-1-fast-non-reasoning.toml similarity index 100% rename from providers/llmgateway/models/xai/grok-4-1-fast-non-reasoning.toml rename to providers/llmgateway/models/grok-4-1-fast-non-reasoning.toml diff --git a/providers/llmgateway/models/xai/grok-4-1-fast-reasoning.toml b/providers/llmgateway/models/grok-4-1-fast-reasoning.toml similarity index 100% rename from providers/llmgateway/models/xai/grok-4-1-fast-reasoning.toml rename to providers/llmgateway/models/grok-4-1-fast-reasoning.toml diff --git a/providers/llmgateway/models/xai/grok-4-fast-non-reasoning.toml b/providers/llmgateway/models/grok-4-fast-non-reasoning.toml similarity index 100% rename from providers/llmgateway/models/xai/grok-4-fast-non-reasoning.toml rename to providers/llmgateway/models/grok-4-fast-non-reasoning.toml diff --git a/providers/llmgateway/models/xai/grok-4-fast-reasoning.toml b/providers/llmgateway/models/grok-4-fast-reasoning.toml similarity index 100% rename from providers/llmgateway/models/xai/grok-4-fast-reasoning.toml rename to providers/llmgateway/models/grok-4-fast-reasoning.toml diff --git a/providers/llmgateway/models/xai/grok-4.toml b/providers/llmgateway/models/grok-4.toml similarity index 100% rename from providers/llmgateway/models/xai/grok-4.toml rename to providers/llmgateway/models/grok-4.toml diff --git a/providers/llmgateway/models/xai/grok-code-fast-1.toml 
b/providers/llmgateway/models/grok-code-fast-1.toml similarity index 100% rename from providers/llmgateway/models/xai/grok-code-fast-1.toml rename to providers/llmgateway/models/grok-code-fast-1.toml diff --git a/providers/llmgateway/models/moonshot/kimi-k2-0905-free.toml b/providers/llmgateway/models/kimi-k2-0905-free.toml similarity index 100% rename from providers/llmgateway/models/moonshot/kimi-k2-0905-free.toml rename to providers/llmgateway/models/kimi-k2-0905-free.toml diff --git a/providers/llmgateway/models/moonshot/kimi-k2-thinking-turbo.toml b/providers/llmgateway/models/kimi-k2-thinking-turbo.toml similarity index 100% rename from providers/llmgateway/models/moonshot/kimi-k2-thinking-turbo.toml rename to providers/llmgateway/models/kimi-k2-thinking-turbo.toml diff --git a/providers/llmgateway/models/moonshot/kimi-k2-thinking.toml b/providers/llmgateway/models/kimi-k2-thinking.toml similarity index 100% rename from providers/llmgateway/models/moonshot/kimi-k2-thinking.toml rename to providers/llmgateway/models/kimi-k2-thinking.toml diff --git a/providers/llmgateway/models/moonshot/kimi-k2.toml b/providers/llmgateway/models/kimi-k2.toml similarity index 100% rename from providers/llmgateway/models/moonshot/kimi-k2.toml rename to providers/llmgateway/models/kimi-k2.toml diff --git a/providers/llmgateway/models/meta/llama-3.1-70b-instruct.toml b/providers/llmgateway/models/llama-3.1-70b-instruct.toml similarity index 100% rename from providers/llmgateway/models/meta/llama-3.1-70b-instruct.toml rename to providers/llmgateway/models/llama-3.1-70b-instruct.toml diff --git a/providers/llmgateway/models/meta/llama-3.1-8b-instruct.toml b/providers/llmgateway/models/llama-3.1-8b-instruct.toml similarity index 100% rename from providers/llmgateway/models/meta/llama-3.1-8b-instruct.toml rename to providers/llmgateway/models/llama-3.1-8b-instruct.toml diff --git a/providers/llmgateway/models/meta/llama-3.1-nemotron-ultra-253b.toml 
b/providers/llmgateway/models/llama-3.1-nemotron-ultra-253b.toml similarity index 100% rename from providers/llmgateway/models/meta/llama-3.1-nemotron-ultra-253b.toml rename to providers/llmgateway/models/llama-3.1-nemotron-ultra-253b.toml diff --git a/providers/llmgateway/models/meta/llama-3.2-11b-instruct.toml b/providers/llmgateway/models/llama-3.2-11b-instruct.toml similarity index 100% rename from providers/llmgateway/models/meta/llama-3.2-11b-instruct.toml rename to providers/llmgateway/models/llama-3.2-11b-instruct.toml diff --git a/providers/llmgateway/models/meta/llama-3.3-70b-instruct-free.toml b/providers/llmgateway/models/llama-3.3-70b-instruct-free.toml similarity index 100% rename from providers/llmgateway/models/meta/llama-3.3-70b-instruct-free.toml rename to providers/llmgateway/models/llama-3.3-70b-instruct-free.toml diff --git a/providers/llmgateway/models/meta/llama-3.3-70b-instruct.toml b/providers/llmgateway/models/llama-3.3-70b-instruct.toml similarity index 100% rename from providers/llmgateway/models/meta/llama-3.3-70b-instruct.toml rename to providers/llmgateway/models/llama-3.3-70b-instruct.toml diff --git a/providers/llmgateway/models/meta/llama-4-maverick-17b-instruct.toml b/providers/llmgateway/models/llama-4-maverick-17b-instruct.toml similarity index 100% rename from providers/llmgateway/models/meta/llama-4-maverick-17b-instruct.toml rename to providers/llmgateway/models/llama-4-maverick-17b-instruct.toml diff --git a/providers/llmgateway/models/meta/llama-4-maverick-free.toml b/providers/llmgateway/models/llama-4-maverick-free.toml similarity index 100% rename from providers/llmgateway/models/meta/llama-4-maverick-free.toml rename to providers/llmgateway/models/llama-4-maverick-free.toml diff --git a/providers/llmgateway/models/meta/llama-4-scout-17b-instruct.toml b/providers/llmgateway/models/llama-4-scout-17b-instruct.toml similarity index 100% rename from providers/llmgateway/models/meta/llama-4-scout-17b-instruct.toml rename to 
providers/llmgateway/models/llama-4-scout-17b-instruct.toml diff --git a/providers/llmgateway/models/meta/llama-4-scout-free.toml b/providers/llmgateway/models/llama-4-scout-free.toml similarity index 100% rename from providers/llmgateway/models/meta/llama-4-scout-free.toml rename to providers/llmgateway/models/llama-4-scout-free.toml diff --git a/providers/llmgateway/models/meta/llama-4-scout.toml b/providers/llmgateway/models/llama-4-scout.toml similarity index 100% rename from providers/llmgateway/models/meta/llama-4-scout.toml rename to providers/llmgateway/models/llama-4-scout.toml diff --git a/providers/llmgateway/models/meta/llama-guard-4-12b.toml b/providers/llmgateway/models/llama-guard-4-12b.toml similarity index 100% rename from providers/llmgateway/models/meta/llama-guard-4-12b.toml rename to providers/llmgateway/models/llama-guard-4-12b.toml diff --git a/providers/llmgateway/models/minimax/minimax-m2.1.toml b/providers/llmgateway/models/minimax-m2.1.toml similarity index 100% rename from providers/llmgateway/models/minimax/minimax-m2.1.toml rename to providers/llmgateway/models/minimax-m2.1.toml diff --git a/providers/llmgateway/models/mistral/mistral-large-latest.toml b/providers/llmgateway/models/mistral-large-latest.toml similarity index 100% rename from providers/llmgateway/models/mistral/mistral-large-latest.toml rename to providers/llmgateway/models/mistral-large-latest.toml diff --git a/providers/llmgateway/models/mistral/mixtral-8x7b-instruct-together.toml b/providers/llmgateway/models/mixtral-8x7b-instruct-together.toml similarity index 100% rename from providers/llmgateway/models/mistral/mixtral-8x7b-instruct-together.toml rename to providers/llmgateway/models/mixtral-8x7b-instruct-together.toml diff --git a/providers/llmgateway/models/nvidia/nemotron-nano-9b-v2.toml b/providers/llmgateway/models/nemotron-nano-9b-v2.toml similarity index 100% rename from providers/llmgateway/models/nvidia/nemotron-nano-9b-v2.toml rename to 
providers/llmgateway/models/nemotron-nano-9b-v2.toml diff --git a/providers/llmgateway/models/openai/o1-mini.toml b/providers/llmgateway/models/o1-mini.toml similarity index 100% rename from providers/llmgateway/models/openai/o1-mini.toml rename to providers/llmgateway/models/o1-mini.toml diff --git a/providers/llmgateway/models/openai/o1.toml b/providers/llmgateway/models/o1.toml similarity index 100% rename from providers/llmgateway/models/openai/o1.toml rename to providers/llmgateway/models/o1.toml diff --git a/providers/llmgateway/models/openai/o3-mini.toml b/providers/llmgateway/models/o3-mini.toml similarity index 100% rename from providers/llmgateway/models/openai/o3-mini.toml rename to providers/llmgateway/models/o3-mini.toml diff --git a/providers/llmgateway/models/openai/o3.toml b/providers/llmgateway/models/o3.toml similarity index 100% rename from providers/llmgateway/models/openai/o3.toml rename to providers/llmgateway/models/o3.toml diff --git a/providers/llmgateway/models/mistral/pixtral-large-latest.toml b/providers/llmgateway/models/pixtral-large-latest.toml similarity index 100% rename from providers/llmgateway/models/mistral/pixtral-large-latest.toml rename to providers/llmgateway/models/pixtral-large-latest.toml diff --git a/providers/llmgateway/models/alibaba/qwen-flash.toml b/providers/llmgateway/models/qwen-flash.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen-flash.toml rename to providers/llmgateway/models/qwen-flash.toml diff --git a/providers/llmgateway/models/alibaba/qwen-image-max-2025-12-30.toml b/providers/llmgateway/models/qwen-image-max-2025-12-30.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen-image-max-2025-12-30.toml rename to providers/llmgateway/models/qwen-image-max-2025-12-30.toml diff --git a/providers/llmgateway/models/alibaba/qwen-image-max.toml b/providers/llmgateway/models/qwen-image-max.toml similarity index 100% rename from 
providers/llmgateway/models/alibaba/qwen-image-max.toml rename to providers/llmgateway/models/qwen-image-max.toml diff --git a/providers/llmgateway/models/alibaba/qwen-image-plus.toml b/providers/llmgateway/models/qwen-image-plus.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen-image-plus.toml rename to providers/llmgateway/models/qwen-image-plus.toml diff --git a/providers/llmgateway/models/alibaba/qwen-image.toml b/providers/llmgateway/models/qwen-image.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen-image.toml rename to providers/llmgateway/models/qwen-image.toml diff --git a/providers/llmgateway/models/alibaba/qwen-max-latest.toml b/providers/llmgateway/models/qwen-max-latest.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen-max-latest.toml rename to providers/llmgateway/models/qwen-max-latest.toml diff --git a/providers/llmgateway/models/alibaba/qwen-max.toml b/providers/llmgateway/models/qwen-max.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen-max.toml rename to providers/llmgateway/models/qwen-max.toml diff --git a/providers/llmgateway/models/alibaba/qwen-omni-turbo.toml b/providers/llmgateway/models/qwen-omni-turbo.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen-omni-turbo.toml rename to providers/llmgateway/models/qwen-omni-turbo.toml diff --git a/providers/llmgateway/models/alibaba/qwen-plus-latest.toml b/providers/llmgateway/models/qwen-plus-latest.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen-plus-latest.toml rename to providers/llmgateway/models/qwen-plus-latest.toml diff --git a/providers/llmgateway/models/alibaba/qwen-plus.toml b/providers/llmgateway/models/qwen-plus.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen-plus.toml rename to providers/llmgateway/models/qwen-plus.toml diff --git 
a/providers/llmgateway/models/alibaba/qwen-turbo.toml b/providers/llmgateway/models/qwen-turbo.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen-turbo.toml rename to providers/llmgateway/models/qwen-turbo.toml diff --git a/providers/llmgateway/models/alibaba/qwen-vl-max.toml b/providers/llmgateway/models/qwen-vl-max.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen-vl-max.toml rename to providers/llmgateway/models/qwen-vl-max.toml diff --git a/providers/llmgateway/models/alibaba/qwen-vl-plus.toml b/providers/llmgateway/models/qwen-vl-plus.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen-vl-plus.toml rename to providers/llmgateway/models/qwen-vl-plus.toml diff --git a/providers/llmgateway/models/alibaba/qwen2-5-vl-72b-instruct.toml b/providers/llmgateway/models/qwen2-5-vl-72b-instruct.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen2-5-vl-72b-instruct.toml rename to providers/llmgateway/models/qwen2-5-vl-72b-instruct.toml diff --git a/providers/llmgateway/models/alibaba/qwen25-coder-7b.toml b/providers/llmgateway/models/qwen25-coder-7b.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen25-coder-7b.toml rename to providers/llmgateway/models/qwen25-coder-7b.toml diff --git a/providers/llmgateway/models/alibaba/qwen3-235b-a22b-instruct-2507.toml b/providers/llmgateway/models/qwen3-235b-a22b-instruct-2507.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen3-235b-a22b-instruct-2507.toml rename to providers/llmgateway/models/qwen3-235b-a22b-instruct-2507.toml diff --git a/providers/llmgateway/models/alibaba/qwen3-235b-a22b-thinking-2507.toml b/providers/llmgateway/models/qwen3-235b-a22b-thinking-2507.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen3-235b-a22b-thinking-2507.toml rename to providers/llmgateway/models/qwen3-235b-a22b-thinking-2507.toml diff --git 
a/providers/llmgateway/models/alibaba/qwen3-30b-a3b-instruct-2507.toml b/providers/llmgateway/models/qwen3-30b-a3b-instruct-2507.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen3-30b-a3b-instruct-2507.toml rename to providers/llmgateway/models/qwen3-30b-a3b-instruct-2507.toml diff --git a/providers/llmgateway/models/alibaba/qwen3-30b-a3b-thinking-2507.toml b/providers/llmgateway/models/qwen3-30b-a3b-thinking-2507.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen3-30b-a3b-thinking-2507.toml rename to providers/llmgateway/models/qwen3-30b-a3b-thinking-2507.toml diff --git a/providers/llmgateway/models/alibaba/qwen3-32b.toml b/providers/llmgateway/models/qwen3-32b.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen3-32b.toml rename to providers/llmgateway/models/qwen3-32b.toml diff --git a/providers/llmgateway/models/alibaba/qwen3-coder-30b-a3b-instruct.toml b/providers/llmgateway/models/qwen3-coder-30b-a3b-instruct.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen3-coder-30b-a3b-instruct.toml rename to providers/llmgateway/models/qwen3-coder-30b-a3b-instruct.toml diff --git a/providers/llmgateway/models/alibaba/qwen3-coder-480b-a35b-instruct.toml b/providers/llmgateway/models/qwen3-coder-480b-a35b-instruct.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen3-coder-480b-a35b-instruct.toml rename to providers/llmgateway/models/qwen3-coder-480b-a35b-instruct.toml diff --git a/providers/llmgateway/models/alibaba/qwen3-coder-plus.toml b/providers/llmgateway/models/qwen3-coder-plus.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen3-coder-plus.toml rename to providers/llmgateway/models/qwen3-coder-plus.toml diff --git a/providers/llmgateway/models/alibaba/qwen3-coder.toml b/providers/llmgateway/models/qwen3-coder.toml similarity index 100% rename from 
providers/llmgateway/models/alibaba/qwen3-coder.toml rename to providers/llmgateway/models/qwen3-coder.toml diff --git a/providers/llmgateway/models/alibaba/qwen3-max.toml b/providers/llmgateway/models/qwen3-max.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen3-max.toml rename to providers/llmgateway/models/qwen3-max.toml diff --git a/providers/llmgateway/models/alibaba/qwen3-next-80b-a3b-instruct.toml b/providers/llmgateway/models/qwen3-next-80b-a3b-instruct.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen3-next-80b-a3b-instruct.toml rename to providers/llmgateway/models/qwen3-next-80b-a3b-instruct.toml diff --git a/providers/llmgateway/models/alibaba/qwen3-next-80b-a3b-thinking.toml b/providers/llmgateway/models/qwen3-next-80b-a3b-thinking.toml similarity index 100% rename from providers/llmgateway/models/alibaba/qwen3-next-80b-a3b-thinking.toml rename to providers/llmgateway/models/qwen3-next-80b-a3b-thinking.toml diff --git a/providers/llmgateway/models/bytedance/seed-1-6-250615.toml b/providers/llmgateway/models/seed-1-6-250615.toml similarity index 100% rename from providers/llmgateway/models/bytedance/seed-1-6-250615.toml rename to providers/llmgateway/models/seed-1-6-250615.toml diff --git a/providers/llmgateway/models/bytedance/seed-1-6-250915.toml b/providers/llmgateway/models/seed-1-6-250915.toml similarity index 100% rename from providers/llmgateway/models/bytedance/seed-1-6-250915.toml rename to providers/llmgateway/models/seed-1-6-250915.toml diff --git a/providers/llmgateway/models/bytedance/seed-1-6-flash-250715.toml b/providers/llmgateway/models/seed-1-6-flash-250715.toml similarity index 100% rename from providers/llmgateway/models/bytedance/seed-1-6-flash-250715.toml rename to providers/llmgateway/models/seed-1-6-flash-250715.toml diff --git a/providers/llmgateway/models/bytedance/seed-1-8-251228.toml b/providers/llmgateway/models/seed-1-8-251228.toml similarity index 100% rename from 
providers/llmgateway/models/bytedance/seed-1-8-251228.toml rename to providers/llmgateway/models/seed-1-8-251228.toml diff --git a/providers/llmgateway/models/bytedance/seedream-4-0.toml b/providers/llmgateway/models/seedream-4-0.toml similarity index 100% rename from providers/llmgateway/models/bytedance/seedream-4-0.toml rename to providers/llmgateway/models/seedream-4-0.toml diff --git a/providers/llmgateway/models/bytedance/seedream-4-5.toml b/providers/llmgateway/models/seedream-4-5.toml similarity index 100% rename from providers/llmgateway/models/bytedance/seedream-4-5.toml rename to providers/llmgateway/models/seedream-4-5.toml diff --git a/providers/llmgateway/models/perplexity/sonar-pro.toml b/providers/llmgateway/models/sonar-pro.toml similarity index 100% rename from providers/llmgateway/models/perplexity/sonar-pro.toml rename to providers/llmgateway/models/sonar-pro.toml diff --git a/providers/llmgateway/models/perplexity/sonar-reasoning-pro.toml b/providers/llmgateway/models/sonar-reasoning-pro.toml similarity index 100% rename from providers/llmgateway/models/perplexity/sonar-reasoning-pro.toml rename to providers/llmgateway/models/sonar-reasoning-pro.toml diff --git a/providers/llmgateway/models/perplexity/sonar.toml b/providers/llmgateway/models/sonar.toml similarity index 100% rename from providers/llmgateway/models/perplexity/sonar.toml rename to providers/llmgateway/models/sonar.toml diff --git a/providers/llmgateway/scripts/generate.ts b/providers/llmgateway/scripts/generate.ts index b2018fcef..26d0e3940 100644 --- a/providers/llmgateway/scripts/generate.ts +++ b/providers/llmgateway/scripts/generate.ts @@ -5,7 +5,7 @@ * npx tsx scripts/export-models-dev.ts * * The script reads models from @llmgateway/models and generates TOML files - * organized by provider subdirectory. + * in the models/ directory. 
*/ // See: https://github.com/theopenco/llmgateway/blob/main/scripts/export-models-dev.ts From 09b5dd4d84deaa5d29c8ea3e71470f29f1e9e3aa Mon Sep 17 00:00:00 2001 From: Luca Steeb Date: Fri, 23 Jan 2026 01:18:53 +0000 Subject: [PATCH 3/8] refactor: remove scripts/ dir, link to repo script Removes empty generate.ts file and scripts/ directory. README now links to llmgateway repo for regeneration. Co-Authored-By: Claude Opus 4.5 --- providers/llmgateway/README.md | 9 ++++++++- providers/llmgateway/scripts/generate.ts | 11 ----------- 2 files changed, 8 insertions(+), 12 deletions(-) delete mode 100644 providers/llmgateway/scripts/generate.ts diff --git a/providers/llmgateway/README.md b/providers/llmgateway/README.md index ff4c0448f..b1efbb418 100644 --- a/providers/llmgateway/README.md +++ b/providers/llmgateway/README.md @@ -5,10 +5,17 @@ This provider enables access to 150+ AI models through [LLM Gateway](https://llm ## Directory Structure - **models/**: TOML configuration files for all supported models -- **scripts/**: Scripts for generating model configurations - **provider.toml**: Provider configuration - **logo.svg**: Provider logo +## Regenerating Models + +Model configurations are generated from the [LLM Gateway repository](https://github.com/theopenco/llmgateway): + +```bash +npx tsx scripts/export-models-dev.ts +``` + ## How It Works LLM Gateway acts as a unified proxy for multiple AI providers. You can access any supported model through a single API endpoint using your LLM Gateway API key. diff --git a/providers/llmgateway/scripts/generate.ts b/providers/llmgateway/scripts/generate.ts deleted file mode 100644 index 26d0e3940..000000000 --- a/providers/llmgateway/scripts/generate.ts +++ /dev/null @@ -1,11 +0,0 @@ -/** - * This script generates model TOML files from the LLM Gateway models package. 
- * - * Run from the llmgateway repository root: - * npx tsx scripts/export-models-dev.ts - * - * The script reads models from @llmgateway/models and generates TOML files - * in the models/ directory. - */ - -// See: https://github.com/theopenco/llmgateway/blob/main/scripts/export-models-dev.ts From e28d4e387fee2256b6f7e8bea20fe9e413632845 Mon Sep 17 00:00:00 2001 From: Luca Steeb Date: Fri, 23 Jan 2026 01:21:06 +0000 Subject: [PATCH 4/8] chore: trigger CI From b22ff136a8341e838749f544592f3047791c016d Mon Sep 17 00:00:00 2001 From: Luca Steeb Date: Fri, 23 Jan 2026 01:25:53 +0000 Subject: [PATCH 5/8] fix: add required output limit to all models models.dev schema requires limit.output field. Defaults to 16384 when not specified. Co-Authored-By: Claude Opus 4.5 --- providers/llmgateway/models/auto.toml | 1 + providers/llmgateway/models/claude-3-5-sonnet.toml | 1 + providers/llmgateway/models/claude-opus-4-20250514.toml | 1 + providers/llmgateway/models/claude-sonnet-4-20250514.toml | 1 + providers/llmgateway/models/custom.toml | 1 + providers/llmgateway/models/deepseek-r1-0528.toml | 1 + providers/llmgateway/models/deepseek-r1t2-chimera-free.toml | 1 + providers/llmgateway/models/deepseek-v3.2.toml | 1 + providers/llmgateway/models/deepseek-v3.toml | 1 + providers/llmgateway/models/gemini-2.0-flash-lite.toml | 1 + providers/llmgateway/models/gemini-2.0-flash.toml | 1 + .../llmgateway/models/gemini-2.5-flash-lite-preview-09-2025.toml | 1 + providers/llmgateway/models/gemini-2.5-flash-lite.toml | 1 + .../llmgateway/models/gemini-2.5-flash-preview-09-2025.toml | 1 + providers/llmgateway/models/gemini-2.5-flash.toml | 1 + providers/llmgateway/models/gemini-2.5-pro.toml | 1 + providers/llmgateway/models/gemma-2-27b-it-together.toml | 1 + providers/llmgateway/models/gemma-3-12b-it.toml | 1 + providers/llmgateway/models/gemma-3-1b-it.toml | 1 + providers/llmgateway/models/gemma-3-27b.toml | 1 + providers/llmgateway/models/gemma-3-4b-it.toml | 1 + 
providers/llmgateway/models/gemma-3n-e2b-it.toml | 1 + providers/llmgateway/models/gemma-3n-e4b-it.toml | 1 + providers/llmgateway/models/glm-4-32b-0414-128k.toml | 1 + providers/llmgateway/models/glm-4.5-air-free.toml | 1 + providers/llmgateway/models/glm-4.5-air.toml | 1 + providers/llmgateway/models/glm-4.5-airx.toml | 1 + providers/llmgateway/models/glm-4.5-flash.toml | 1 + providers/llmgateway/models/glm-4.5-x.toml | 1 + providers/llmgateway/models/glm-4.5.toml | 1 + providers/llmgateway/models/glm-4.6.toml | 1 + providers/llmgateway/models/gpt-3.5-turbo.toml | 1 + providers/llmgateway/models/gpt-4-turbo.toml | 1 + providers/llmgateway/models/gpt-4.1-mini.toml | 1 + providers/llmgateway/models/gpt-4.1-nano.toml | 1 + providers/llmgateway/models/gpt-4.1.toml | 1 + providers/llmgateway/models/gpt-oss-20b-free.toml | 1 + providers/llmgateway/models/grok-3-mini.toml | 1 + providers/llmgateway/models/grok-3.toml | 1 + providers/llmgateway/models/grok-4-1-fast-non-reasoning.toml | 1 + providers/llmgateway/models/grok-4-1-fast-reasoning.toml | 1 + providers/llmgateway/models/grok-4-fast-non-reasoning.toml | 1 + providers/llmgateway/models/grok-4-fast-reasoning.toml | 1 + providers/llmgateway/models/kimi-k2-0905-free.toml | 1 + providers/llmgateway/models/llama-3.1-nemotron-ultra-253b.toml | 1 + providers/llmgateway/models/llama-3.2-11b-instruct.toml | 1 + providers/llmgateway/models/llama-3.3-70b-instruct-free.toml | 1 + providers/llmgateway/models/llama-3.3-70b-instruct.toml | 1 + providers/llmgateway/models/llama-4-maverick-free.toml | 1 + providers/llmgateway/models/llama-4-scout-free.toml | 1 + providers/llmgateway/models/llama-4-scout.toml | 1 + providers/llmgateway/models/llama-guard-4-12b.toml | 1 + providers/llmgateway/models/mistral-large-latest.toml | 1 + providers/llmgateway/models/mixtral-8x7b-instruct-together.toml | 1 + providers/llmgateway/models/nemotron-nano-9b-v2.toml | 1 + providers/llmgateway/models/o1-mini.toml | 1 + 
providers/llmgateway/models/o1.toml | 1 + providers/llmgateway/models/o3-mini.toml | 1 + providers/llmgateway/models/o3.toml | 1 + providers/llmgateway/models/pixtral-large-latest.toml | 1 + providers/llmgateway/models/seed-1-6-250615.toml | 1 + providers/llmgateway/models/seed-1-6-250915.toml | 1 + providers/llmgateway/models/seed-1-6-flash-250715.toml | 1 + providers/llmgateway/models/seed-1-8-251228.toml | 1 + providers/llmgateway/models/sonar-pro.toml | 1 + providers/llmgateway/models/sonar-reasoning-pro.toml | 1 + providers/llmgateway/models/sonar.toml | 1 + 67 files changed, 67 insertions(+) diff --git a/providers/llmgateway/models/auto.toml b/providers/llmgateway/models/auto.toml index 2b97f2d94..108cc28d1 100644 --- a/providers/llmgateway/models/auto.toml +++ b/providers/llmgateway/models/auto.toml @@ -15,6 +15,7 @@ output = 0.00 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/claude-3-5-sonnet.toml b/providers/llmgateway/models/claude-3-5-sonnet.toml index 0990095d4..e06f756fc 100644 --- a/providers/llmgateway/models/claude-3-5-sonnet.toml +++ b/providers/llmgateway/models/claude-3-5-sonnet.toml @@ -16,6 +16,7 @@ cache_read = 0.30 [limit] context = 200_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/claude-opus-4-20250514.toml b/providers/llmgateway/models/claude-opus-4-20250514.toml index 5198af3bb..54b6a2f56 100644 --- a/providers/llmgateway/models/claude-opus-4-20250514.toml +++ b/providers/llmgateway/models/claude-opus-4-20250514.toml @@ -16,6 +16,7 @@ cache_read = 1.50 [limit] context = 200_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/claude-sonnet-4-20250514.toml b/providers/llmgateway/models/claude-sonnet-4-20250514.toml index f2b6be2ee..4853becd5 100644 --- a/providers/llmgateway/models/claude-sonnet-4-20250514.toml +++ b/providers/llmgateway/models/claude-sonnet-4-20250514.toml @@ 
-16,6 +16,7 @@ cache_read = 0.30 [limit] context = 200_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/custom.toml b/providers/llmgateway/models/custom.toml index 704724161..043a3bcb8 100644 --- a/providers/llmgateway/models/custom.toml +++ b/providers/llmgateway/models/custom.toml @@ -15,6 +15,7 @@ output = 0.00 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/deepseek-r1-0528.toml b/providers/llmgateway/models/deepseek-r1-0528.toml index c5ad7528a..a7e000a7b 100644 --- a/providers/llmgateway/models/deepseek-r1-0528.toml +++ b/providers/llmgateway/models/deepseek-r1-0528.toml @@ -16,6 +16,7 @@ output = 1.00 [limit] context = 32_770 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/deepseek-r1t2-chimera-free.toml b/providers/llmgateway/models/deepseek-r1t2-chimera-free.toml index a3acc1c18..04988cd0b 100644 --- a/providers/llmgateway/models/deepseek-r1t2-chimera-free.toml +++ b/providers/llmgateway/models/deepseek-r1t2-chimera-free.toml @@ -15,6 +15,7 @@ output = 0.00 [limit] context = 163_840 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/deepseek-v3.2.toml b/providers/llmgateway/models/deepseek-v3.2.toml index 7621f7616..6466fced7 100644 --- a/providers/llmgateway/models/deepseek-v3.2.toml +++ b/providers/llmgateway/models/deepseek-v3.2.toml @@ -16,6 +16,7 @@ cache_read = 0.03 [limit] context = 163_840 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/deepseek-v3.toml b/providers/llmgateway/models/deepseek-v3.toml index a8205555b..8daba1c87 100644 --- a/providers/llmgateway/models/deepseek-v3.toml +++ b/providers/llmgateway/models/deepseek-v3.toml @@ -15,6 +15,7 @@ output = 0.40 [limit] context = 163_840 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/gemini-2.0-flash-lite.toml 
b/providers/llmgateway/models/gemini-2.0-flash-lite.toml index ec66df596..d4d0e237c 100644 --- a/providers/llmgateway/models/gemini-2.0-flash-lite.toml +++ b/providers/llmgateway/models/gemini-2.0-flash-lite.toml @@ -15,6 +15,7 @@ output = 0.30 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/gemini-2.0-flash.toml b/providers/llmgateway/models/gemini-2.0-flash.toml index 13813e688..a041f03b2 100644 --- a/providers/llmgateway/models/gemini-2.0-flash.toml +++ b/providers/llmgateway/models/gemini-2.0-flash.toml @@ -15,6 +15,7 @@ output = 0.40 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/gemini-2.5-flash-lite-preview-09-2025.toml b/providers/llmgateway/models/gemini-2.5-flash-lite-preview-09-2025.toml index 3be518566..c3ca4f53d 100644 --- a/providers/llmgateway/models/gemini-2.5-flash-lite-preview-09-2025.toml +++ b/providers/llmgateway/models/gemini-2.5-flash-lite-preview-09-2025.toml @@ -16,6 +16,7 @@ cache_read = 0.03 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/gemini-2.5-flash-lite.toml b/providers/llmgateway/models/gemini-2.5-flash-lite.toml index f2f36a655..9e75f16c6 100644 --- a/providers/llmgateway/models/gemini-2.5-flash-lite.toml +++ b/providers/llmgateway/models/gemini-2.5-flash-lite.toml @@ -16,6 +16,7 @@ cache_read = 0.03 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/gemini-2.5-flash-preview-09-2025.toml b/providers/llmgateway/models/gemini-2.5-flash-preview-09-2025.toml index 016e176f4..9427be50e 100644 --- a/providers/llmgateway/models/gemini-2.5-flash-preview-09-2025.toml +++ b/providers/llmgateway/models/gemini-2.5-flash-preview-09-2025.toml @@ -16,6 +16,7 @@ cache_read = 0.08 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text", "image"] 
diff --git a/providers/llmgateway/models/gemini-2.5-flash.toml b/providers/llmgateway/models/gemini-2.5-flash.toml index e554e4953..3c5116433 100644 --- a/providers/llmgateway/models/gemini-2.5-flash.toml +++ b/providers/llmgateway/models/gemini-2.5-flash.toml @@ -16,6 +16,7 @@ cache_read = 0.08 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/gemini-2.5-pro.toml b/providers/llmgateway/models/gemini-2.5-pro.toml index 8b5822ce6..b4489f17e 100644 --- a/providers/llmgateway/models/gemini-2.5-pro.toml +++ b/providers/llmgateway/models/gemini-2.5-pro.toml @@ -15,6 +15,7 @@ output = 10.00 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/gemma-2-27b-it-together.toml b/providers/llmgateway/models/gemma-2-27b-it-together.toml index 3fca28b14..5c6949729 100644 --- a/providers/llmgateway/models/gemma-2-27b-it-together.toml +++ b/providers/llmgateway/models/gemma-2-27b-it-together.toml @@ -15,6 +15,7 @@ output = 0.08 [limit] context = 8_192 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/gemma-3-12b-it.toml b/providers/llmgateway/models/gemma-3-12b-it.toml index 11359a07d..f79774a62 100644 --- a/providers/llmgateway/models/gemma-3-12b-it.toml +++ b/providers/llmgateway/models/gemma-3-12b-it.toml @@ -15,6 +15,7 @@ output = 0.30 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/gemma-3-1b-it.toml b/providers/llmgateway/models/gemma-3-1b-it.toml index f24d5f4af..94edf0326 100644 --- a/providers/llmgateway/models/gemma-3-1b-it.toml +++ b/providers/llmgateway/models/gemma-3-1b-it.toml @@ -15,6 +15,7 @@ output = 0.30 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/gemma-3-27b.toml b/providers/llmgateway/models/gemma-3-27b.toml index f985d5c43..dd9a9f441 100644 
--- a/providers/llmgateway/models/gemma-3-27b.toml +++ b/providers/llmgateway/models/gemma-3-27b.toml @@ -15,6 +15,7 @@ output = 0.27 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/gemma-3-4b-it.toml b/providers/llmgateway/models/gemma-3-4b-it.toml index aad27de8c..adfabe1db 100644 --- a/providers/llmgateway/models/gemma-3-4b-it.toml +++ b/providers/llmgateway/models/gemma-3-4b-it.toml @@ -15,6 +15,7 @@ output = 0.30 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/gemma-3n-e2b-it.toml b/providers/llmgateway/models/gemma-3n-e2b-it.toml index 39b1c0cfd..14ba44048 100644 --- a/providers/llmgateway/models/gemma-3n-e2b-it.toml +++ b/providers/llmgateway/models/gemma-3n-e2b-it.toml @@ -15,6 +15,7 @@ output = 0.30 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/gemma-3n-e4b-it.toml b/providers/llmgateway/models/gemma-3n-e4b-it.toml index 338f81bb9..add3fd781 100644 --- a/providers/llmgateway/models/gemma-3n-e4b-it.toml +++ b/providers/llmgateway/models/gemma-3n-e4b-it.toml @@ -15,6 +15,7 @@ output = 0.30 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/glm-4-32b-0414-128k.toml b/providers/llmgateway/models/glm-4-32b-0414-128k.toml index 10c00a8d5..589c26730 100644 --- a/providers/llmgateway/models/glm-4-32b-0414-128k.toml +++ b/providers/llmgateway/models/glm-4-32b-0414-128k.toml @@ -15,6 +15,7 @@ output = 0.10 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/glm-4.5-air-free.toml b/providers/llmgateway/models/glm-4.5-air-free.toml index 3fdadfc97..da9213c4f 100644 --- a/providers/llmgateway/models/glm-4.5-air-free.toml +++ b/providers/llmgateway/models/glm-4.5-air-free.toml @@ -15,6 +15,7 @@ output = 0.00 [limit] context = 131_072 
+output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/glm-4.5-air.toml b/providers/llmgateway/models/glm-4.5-air.toml index ad2807cd8..f4d82aabb 100644 --- a/providers/llmgateway/models/glm-4.5-air.toml +++ b/providers/llmgateway/models/glm-4.5-air.toml @@ -16,6 +16,7 @@ cache_read = 0.03 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/glm-4.5-airx.toml b/providers/llmgateway/models/glm-4.5-airx.toml index 9271836e0..b2753490b 100644 --- a/providers/llmgateway/models/glm-4.5-airx.toml +++ b/providers/llmgateway/models/glm-4.5-airx.toml @@ -16,6 +16,7 @@ cache_read = 0.22 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/glm-4.5-flash.toml b/providers/llmgateway/models/glm-4.5-flash.toml index c2a28d5f5..88ead7822 100644 --- a/providers/llmgateway/models/glm-4.5-flash.toml +++ b/providers/llmgateway/models/glm-4.5-flash.toml @@ -15,6 +15,7 @@ output = 0.00 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/glm-4.5-x.toml b/providers/llmgateway/models/glm-4.5-x.toml index fd3226bc4..7b8ab8646 100644 --- a/providers/llmgateway/models/glm-4.5-x.toml +++ b/providers/llmgateway/models/glm-4.5-x.toml @@ -17,6 +17,7 @@ cache_read = 0.45 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/glm-4.5.toml b/providers/llmgateway/models/glm-4.5.toml index aa4e01188..ea514b061 100644 --- a/providers/llmgateway/models/glm-4.5.toml +++ b/providers/llmgateway/models/glm-4.5.toml @@ -16,6 +16,7 @@ cache_read = 0.11 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/glm-4.6.toml b/providers/llmgateway/models/glm-4.6.toml index 0019cbb11..fb2cdacd0 100644 --- a/providers/llmgateway/models/glm-4.6.toml +++ 
b/providers/llmgateway/models/glm-4.6.toml @@ -16,6 +16,7 @@ cache_read = 0.11 [limit] context = 200_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/gpt-3.5-turbo.toml b/providers/llmgateway/models/gpt-3.5-turbo.toml index 687b10243..66200229a 100644 --- a/providers/llmgateway/models/gpt-3.5-turbo.toml +++ b/providers/llmgateway/models/gpt-3.5-turbo.toml @@ -15,6 +15,7 @@ output = 1.50 [limit] context = 16_385 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/gpt-4-turbo.toml b/providers/llmgateway/models/gpt-4-turbo.toml index 3d8e0a676..e34fa95ba 100644 --- a/providers/llmgateway/models/gpt-4-turbo.toml +++ b/providers/llmgateway/models/gpt-4-turbo.toml @@ -15,6 +15,7 @@ output = 30.00 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/gpt-4.1-mini.toml b/providers/llmgateway/models/gpt-4.1-mini.toml index 0d4a5028e..ea8f82488 100644 --- a/providers/llmgateway/models/gpt-4.1-mini.toml +++ b/providers/llmgateway/models/gpt-4.1-mini.toml @@ -15,6 +15,7 @@ output = 1.60 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/gpt-4.1-nano.toml b/providers/llmgateway/models/gpt-4.1-nano.toml index 5fd989c10..2dc114d05 100644 --- a/providers/llmgateway/models/gpt-4.1-nano.toml +++ b/providers/llmgateway/models/gpt-4.1-nano.toml @@ -15,6 +15,7 @@ output = 0.40 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/gpt-4.1.toml b/providers/llmgateway/models/gpt-4.1.toml index 9da5b49b1..028344e4e 100644 --- a/providers/llmgateway/models/gpt-4.1.toml +++ b/providers/llmgateway/models/gpt-4.1.toml @@ -15,6 +15,7 @@ output = 8.00 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/gpt-oss-20b-free.toml 
b/providers/llmgateway/models/gpt-oss-20b-free.toml index a7e17f57a..ad9142add 100644 --- a/providers/llmgateway/models/gpt-oss-20b-free.toml +++ b/providers/llmgateway/models/gpt-oss-20b-free.toml @@ -15,6 +15,7 @@ output = 0.00 [limit] context = 131_072 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/grok-3-mini.toml b/providers/llmgateway/models/grok-3-mini.toml index cce79b8b8..9ffc91d63 100644 --- a/providers/llmgateway/models/grok-3-mini.toml +++ b/providers/llmgateway/models/grok-3-mini.toml @@ -15,6 +15,7 @@ output = 0.50 [limit] context = 131_072 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/grok-3.toml b/providers/llmgateway/models/grok-3.toml index fc9570b94..aaa58f184 100644 --- a/providers/llmgateway/models/grok-3.toml +++ b/providers/llmgateway/models/grok-3.toml @@ -15,6 +15,7 @@ output = 15.00 [limit] context = 131_072 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/grok-4-1-fast-non-reasoning.toml b/providers/llmgateway/models/grok-4-1-fast-non-reasoning.toml index 58dc2022d..615e6b2a4 100644 --- a/providers/llmgateway/models/grok-4-1-fast-non-reasoning.toml +++ b/providers/llmgateway/models/grok-4-1-fast-non-reasoning.toml @@ -15,6 +15,7 @@ output = 15.00 [limit] context = 2_000_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/grok-4-1-fast-reasoning.toml b/providers/llmgateway/models/grok-4-1-fast-reasoning.toml index 55d855599..0b16eadbf 100644 --- a/providers/llmgateway/models/grok-4-1-fast-reasoning.toml +++ b/providers/llmgateway/models/grok-4-1-fast-reasoning.toml @@ -15,6 +15,7 @@ output = 15.00 [limit] context = 2_000_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/grok-4-fast-non-reasoning.toml b/providers/llmgateway/models/grok-4-fast-non-reasoning.toml index 1dae5d1b0..39807c91a 100644 --- 
a/providers/llmgateway/models/grok-4-fast-non-reasoning.toml +++ b/providers/llmgateway/models/grok-4-fast-non-reasoning.toml @@ -16,6 +16,7 @@ cache_read = 0.05 [limit] context = 2_000_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/grok-4-fast-reasoning.toml b/providers/llmgateway/models/grok-4-fast-reasoning.toml index 9b6b2c0dc..4778a6d64 100644 --- a/providers/llmgateway/models/grok-4-fast-reasoning.toml +++ b/providers/llmgateway/models/grok-4-fast-reasoning.toml @@ -16,6 +16,7 @@ cache_read = 0.05 [limit] context = 2_000_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/kimi-k2-0905-free.toml b/providers/llmgateway/models/kimi-k2-0905-free.toml index e386f653f..93ebbe4fb 100644 --- a/providers/llmgateway/models/kimi-k2-0905-free.toml +++ b/providers/llmgateway/models/kimi-k2-0905-free.toml @@ -15,6 +15,7 @@ output = 0.00 [limit] context = 131_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/llama-3.1-nemotron-ultra-253b.toml b/providers/llmgateway/models/llama-3.1-nemotron-ultra-253b.toml index aad971910..db4efb8d0 100644 --- a/providers/llmgateway/models/llama-3.1-nemotron-ultra-253b.toml +++ b/providers/llmgateway/models/llama-3.1-nemotron-ultra-253b.toml @@ -15,6 +15,7 @@ output = 1.80 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/llama-3.2-11b-instruct.toml b/providers/llmgateway/models/llama-3.2-11b-instruct.toml index 9956a2ee2..5bc16d2c1 100644 --- a/providers/llmgateway/models/llama-3.2-11b-instruct.toml +++ b/providers/llmgateway/models/llama-3.2-11b-instruct.toml @@ -16,6 +16,7 @@ output = 0.33 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/llama-3.3-70b-instruct-free.toml b/providers/llmgateway/models/llama-3.3-70b-instruct-free.toml index 67cc88ec0..74b47b1f8 100644 --- 
a/providers/llmgateway/models/llama-3.3-70b-instruct-free.toml +++ b/providers/llmgateway/models/llama-3.3-70b-instruct-free.toml @@ -15,6 +15,7 @@ output = 0.00 [limit] context = 131_072 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/llama-3.3-70b-instruct.toml b/providers/llmgateway/models/llama-3.3-70b-instruct.toml index b298b41f0..dd36a6d3c 100644 --- a/providers/llmgateway/models/llama-3.3-70b-instruct.toml +++ b/providers/llmgateway/models/llama-3.3-70b-instruct.toml @@ -15,6 +15,7 @@ output = 0.40 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/llama-4-maverick-free.toml b/providers/llmgateway/models/llama-4-maverick-free.toml index 7aa7b2935..4bb90ca72 100644 --- a/providers/llmgateway/models/llama-4-maverick-free.toml +++ b/providers/llmgateway/models/llama-4-maverick-free.toml @@ -15,6 +15,7 @@ output = 0.00 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/llama-4-scout-free.toml b/providers/llmgateway/models/llama-4-scout-free.toml index b2ae4a8b2..6b13e6ded 100644 --- a/providers/llmgateway/models/llama-4-scout-free.toml +++ b/providers/llmgateway/models/llama-4-scout-free.toml @@ -15,6 +15,7 @@ output = 0.00 [limit] context = 1_000_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/llama-4-scout.toml b/providers/llmgateway/models/llama-4-scout.toml index 256aa0138..a95487fee 100644 --- a/providers/llmgateway/models/llama-4-scout.toml +++ b/providers/llmgateway/models/llama-4-scout.toml @@ -16,6 +16,7 @@ output = 0.59 [limit] context = 32_768 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/llama-guard-4-12b.toml b/providers/llmgateway/models/llama-guard-4-12b.toml index 1d820fd0d..fa5977153 100644 --- a/providers/llmgateway/models/llama-guard-4-12b.toml +++ 
b/providers/llmgateway/models/llama-guard-4-12b.toml @@ -15,6 +15,7 @@ output = 0.20 [limit] context = 131_072 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/mistral-large-latest.toml b/providers/llmgateway/models/mistral-large-latest.toml index ea18276b1..5e308028e 100644 --- a/providers/llmgateway/models/mistral-large-latest.toml +++ b/providers/llmgateway/models/mistral-large-latest.toml @@ -15,6 +15,7 @@ output = 12.00 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/mixtral-8x7b-instruct-together.toml b/providers/llmgateway/models/mixtral-8x7b-instruct-together.toml index d078931b8..155c4e94a 100644 --- a/providers/llmgateway/models/mixtral-8x7b-instruct-together.toml +++ b/providers/llmgateway/models/mixtral-8x7b-instruct-together.toml @@ -15,6 +15,7 @@ output = 0.06 [limit] context = 32_768 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/nemotron-nano-9b-v2.toml b/providers/llmgateway/models/nemotron-nano-9b-v2.toml index 020437c46..c08033209 100644 --- a/providers/llmgateway/models/nemotron-nano-9b-v2.toml +++ b/providers/llmgateway/models/nemotron-nano-9b-v2.toml @@ -15,6 +15,7 @@ output = 0.00 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/o1-mini.toml b/providers/llmgateway/models/o1-mini.toml index 6e5858e7a..9792911dc 100644 --- a/providers/llmgateway/models/o1-mini.toml +++ b/providers/llmgateway/models/o1-mini.toml @@ -16,6 +16,7 @@ output = 4.40 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/o1.toml b/providers/llmgateway/models/o1.toml index fdcc29e57..eeea2a993 100644 --- a/providers/llmgateway/models/o1.toml +++ b/providers/llmgateway/models/o1.toml @@ -15,6 +15,7 @@ output = 60.00 [limit] context = 200_000 +output = 16_384 [modalities] input = ["text", "image"] diff 
--git a/providers/llmgateway/models/o3-mini.toml b/providers/llmgateway/models/o3-mini.toml index 4ac3fa9b5..db4d9e80c 100644 --- a/providers/llmgateway/models/o3-mini.toml +++ b/providers/llmgateway/models/o3-mini.toml @@ -15,6 +15,7 @@ output = 4.40 [limit] context = 200_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/o3.toml b/providers/llmgateway/models/o3.toml index bf81a3035..ec7e098e1 100644 --- a/providers/llmgateway/models/o3.toml +++ b/providers/llmgateway/models/o3.toml @@ -15,6 +15,7 @@ output = 8.00 [limit] context = 200_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/pixtral-large-latest.toml b/providers/llmgateway/models/pixtral-large-latest.toml index f56e355b8..1d6c5af2e 100644 --- a/providers/llmgateway/models/pixtral-large-latest.toml +++ b/providers/llmgateway/models/pixtral-large-latest.toml @@ -15,6 +15,7 @@ output = 12.00 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/seed-1-6-250615.toml b/providers/llmgateway/models/seed-1-6-250615.toml index 5683b7a99..28d525143 100644 --- a/providers/llmgateway/models/seed-1-6-250615.toml +++ b/providers/llmgateway/models/seed-1-6-250615.toml @@ -16,6 +16,7 @@ cache_read = 0.05 [limit] context = 256_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/seed-1-6-250915.toml b/providers/llmgateway/models/seed-1-6-250915.toml index bb37198a3..28407e97c 100644 --- a/providers/llmgateway/models/seed-1-6-250915.toml +++ b/providers/llmgateway/models/seed-1-6-250915.toml @@ -16,6 +16,7 @@ cache_read = 0.05 [limit] context = 256_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/seed-1-6-flash-250715.toml b/providers/llmgateway/models/seed-1-6-flash-250715.toml index 4d152a0f8..0b587efe1 100644 --- 
a/providers/llmgateway/models/seed-1-6-flash-250715.toml +++ b/providers/llmgateway/models/seed-1-6-flash-250715.toml @@ -16,6 +16,7 @@ cache_read = 0.02 [limit] context = 256_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/seed-1-8-251228.toml b/providers/llmgateway/models/seed-1-8-251228.toml index 8f6998609..348e25027 100644 --- a/providers/llmgateway/models/seed-1-8-251228.toml +++ b/providers/llmgateway/models/seed-1-8-251228.toml @@ -16,6 +16,7 @@ cache_read = 0.05 [limit] context = 256_000 +output = 16_384 [modalities] input = ["text", "image"] diff --git a/providers/llmgateway/models/sonar-pro.toml b/providers/llmgateway/models/sonar-pro.toml index 80d05b4d1..012f3d1a2 100644 --- a/providers/llmgateway/models/sonar-pro.toml +++ b/providers/llmgateway/models/sonar-pro.toml @@ -15,6 +15,7 @@ output = 15.00 [limit] context = 200_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/sonar-reasoning-pro.toml b/providers/llmgateway/models/sonar-reasoning-pro.toml index 72f099ec5..b4d3006e7 100644 --- a/providers/llmgateway/models/sonar-reasoning-pro.toml +++ b/providers/llmgateway/models/sonar-reasoning-pro.toml @@ -15,6 +15,7 @@ output = 8.00 [limit] context = 128_000 +output = 16_384 [modalities] input = ["text"] diff --git a/providers/llmgateway/models/sonar.toml b/providers/llmgateway/models/sonar.toml index 8a9b44c64..5615ef7ec 100644 --- a/providers/llmgateway/models/sonar.toml +++ b/providers/llmgateway/models/sonar.toml @@ -15,6 +15,7 @@ output = 1.00 [limit] context = 130_000 +output = 16_384 [modalities] input = ["text"] From e8a67936545ae9d77c76b7377150d65ca68533ca Mon Sep 17 00:00:00 2001 From: Luca Steeb Date: Fri, 23 Jan 2026 01:27:15 +0000 Subject: [PATCH 6/8] fix: use valid models.dev family enum values MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Maps internal family names to valid models.dev families: - moonshot 
→ kimi - bytedance → seed - zai → glm - nvidia → nemotron Co-Authored-By: Claude Opus 4.5 --- providers/llmgateway/models/cogview-4.toml | 2 +- providers/llmgateway/models/kimi-k2-thinking-turbo.toml | 2 +- providers/llmgateway/models/kimi-k2-thinking.toml | 2 +- providers/llmgateway/models/kimi-k2.toml | 2 +- providers/llmgateway/models/nemotron-nano-9b-v2.toml | 2 +- providers/llmgateway/models/seed-1-6-250615.toml | 2 +- providers/llmgateway/models/seed-1-6-250915.toml | 2 +- providers/llmgateway/models/seed-1-6-flash-250715.toml | 2 +- providers/llmgateway/models/seed-1-8-251228.toml | 2 +- providers/llmgateway/models/seedream-4-0.toml | 2 +- providers/llmgateway/models/seedream-4-5.toml | 2 +- 11 files changed, 11 insertions(+), 11 deletions(-) diff --git a/providers/llmgateway/models/cogview-4.toml b/providers/llmgateway/models/cogview-4.toml index 45b21ce82..0eb9aac02 100644 --- a/providers/llmgateway/models/cogview-4.toml +++ b/providers/llmgateway/models/cogview-4.toml @@ -1,5 +1,5 @@ name = "CogView-4" -family = "zai" +family = "glm" release_date = "2025-03-04" last_updated = "2025-03-04" attachment = false diff --git a/providers/llmgateway/models/kimi-k2-thinking-turbo.toml b/providers/llmgateway/models/kimi-k2-thinking-turbo.toml index 89bf1d152..391a4f5a4 100644 --- a/providers/llmgateway/models/kimi-k2-thinking-turbo.toml +++ b/providers/llmgateway/models/kimi-k2-thinking-turbo.toml @@ -1,5 +1,5 @@ name = "Kimi K2 Thinking Turbo" -family = "moonshot" +family = "kimi" release_date = "2025-11-06" last_updated = "2025-11-06" attachment = false diff --git a/providers/llmgateway/models/kimi-k2-thinking.toml b/providers/llmgateway/models/kimi-k2-thinking.toml index fad4b66e4..4d1986388 100644 --- a/providers/llmgateway/models/kimi-k2-thinking.toml +++ b/providers/llmgateway/models/kimi-k2-thinking.toml @@ -1,5 +1,5 @@ name = "Kimi K2 Thinking" -family = "moonshot" +family = "kimi" release_date = "2025-11-06" last_updated = "2025-11-06" attachment = false 
diff --git a/providers/llmgateway/models/kimi-k2.toml b/providers/llmgateway/models/kimi-k2.toml index 8ee8fbdc1..e794e5092 100644 --- a/providers/llmgateway/models/kimi-k2.toml +++ b/providers/llmgateway/models/kimi-k2.toml @@ -1,5 +1,5 @@ name = "Kimi K2" -family = "moonshot" +family = "kimi" release_date = "2025-07-11" last_updated = "2025-07-11" attachment = false diff --git a/providers/llmgateway/models/nemotron-nano-9b-v2.toml b/providers/llmgateway/models/nemotron-nano-9b-v2.toml index c08033209..e80608bbd 100644 --- a/providers/llmgateway/models/nemotron-nano-9b-v2.toml +++ b/providers/llmgateway/models/nemotron-nano-9b-v2.toml @@ -1,5 +1,5 @@ name = "Nemotron Nano 9B V2 (Free)" -family = "nvidia" +family = "nemotron" release_date = "2025-08-18" last_updated = "2025-08-18" attachment = false diff --git a/providers/llmgateway/models/seed-1-6-250615.toml b/providers/llmgateway/models/seed-1-6-250615.toml index 28d525143..f005e5e57 100644 --- a/providers/llmgateway/models/seed-1-6-250615.toml +++ b/providers/llmgateway/models/seed-1-6-250615.toml @@ -1,5 +1,5 @@ name = "Seed 1.6 (250615)" -family = "bytedance" +family = "seed" release_date = "2025-06-25" last_updated = "2025-06-25" attachment = true diff --git a/providers/llmgateway/models/seed-1-6-250915.toml b/providers/llmgateway/models/seed-1-6-250915.toml index 28407e97c..436438370 100644 --- a/providers/llmgateway/models/seed-1-6-250915.toml +++ b/providers/llmgateway/models/seed-1-6-250915.toml @@ -1,5 +1,5 @@ name = "Seed 1.6 (250915)" -family = "bytedance" +family = "seed" release_date = "2025-09-15" last_updated = "2025-09-15" attachment = true diff --git a/providers/llmgateway/models/seed-1-6-flash-250715.toml b/providers/llmgateway/models/seed-1-6-flash-250715.toml index 0b587efe1..22a4b7277 100644 --- a/providers/llmgateway/models/seed-1-6-flash-250715.toml +++ b/providers/llmgateway/models/seed-1-6-flash-250715.toml @@ -1,5 +1,5 @@ name = "Seed 1.6 Flash (250715)" -family = "bytedance" +family = 
"seed" release_date = "2025-07-26" last_updated = "2025-07-26" attachment = true diff --git a/providers/llmgateway/models/seed-1-8-251228.toml b/providers/llmgateway/models/seed-1-8-251228.toml index 348e25027..46b0677e9 100644 --- a/providers/llmgateway/models/seed-1-8-251228.toml +++ b/providers/llmgateway/models/seed-1-8-251228.toml @@ -1,5 +1,5 @@ name = "Seed 1.8 (251228)" -family = "bytedance" +family = "seed" release_date = "2025-12-18" last_updated = "2025-12-18" attachment = true diff --git a/providers/llmgateway/models/seedream-4-0.toml b/providers/llmgateway/models/seedream-4-0.toml index 54b70ed17..df444f37e 100644 --- a/providers/llmgateway/models/seedream-4-0.toml +++ b/providers/llmgateway/models/seedream-4-0.toml @@ -1,5 +1,5 @@ name = "Seedream 4.0" -family = "bytedance" +family = "seed" release_date = "2025-09-16" last_updated = "2025-09-16" attachment = false diff --git a/providers/llmgateway/models/seedream-4-5.toml b/providers/llmgateway/models/seedream-4-5.toml index 1046c0e67..59d1b36c4 100644 --- a/providers/llmgateway/models/seedream-4-5.toml +++ b/providers/llmgateway/models/seedream-4-5.toml @@ -1,5 +1,5 @@ name = "Seedream 4.5" -family = "bytedance" +family = "seed" release_date = "2025-12-03" last_updated = "2025-12-03" attachment = false From 6b9b340fbcbbbb85e3dcfdaa430c3c7b00d60aa9 Mon Sep 17 00:00:00 2001 From: Luca Steeb Date: Fri, 23 Jan 2026 01:28:38 +0000 Subject: [PATCH 7/8] fix: map llmgateway family to auto Co-Authored-By: Claude Opus 4.5 --- providers/llmgateway/models/auto.toml | 2 +- providers/llmgateway/models/custom.toml | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/providers/llmgateway/models/auto.toml b/providers/llmgateway/models/auto.toml index 108cc28d1..d6548da5b 100644 --- a/providers/llmgateway/models/auto.toml +++ b/providers/llmgateway/models/auto.toml @@ -1,5 +1,5 @@ name = "Auto Route" -family = "llmgateway" +family = "auto" release_date = "2024-01-01" last_updated = "2024-01-01" 
attachment = true diff --git a/providers/llmgateway/models/custom.toml b/providers/llmgateway/models/custom.toml index 043a3bcb8..2f244ede3 100644 --- a/providers/llmgateway/models/custom.toml +++ b/providers/llmgateway/models/custom.toml @@ -1,5 +1,5 @@ name = "Custom Model" -family = "llmgateway" +family = "auto" release_date = "2024-01-01" last_updated = "2024-01-01" attachment = true From 92269282eb3b1f2f19f2080ec52977ac5fa5a86b Mon Sep 17 00:00:00 2001 From: Luca Steeb Date: Fri, 23 Jan 2026 01:36:29 +0000 Subject: [PATCH 8/8] fix: use correct family for gemma and gpt-oss models - Gemma models now use "gemma" family instead of "gemini" - GPT OSS models now use "gpt-oss" family instead of "gpt" Co-Authored-By: Claude Opus 4.5 --- providers/llmgateway/models/gemma-2-27b-it-together.toml | 2 +- providers/llmgateway/models/gemma-3-12b-it.toml | 2 +- providers/llmgateway/models/gemma-3-1b-it.toml | 2 +- providers/llmgateway/models/gemma-3-27b.toml | 2 +- providers/llmgateway/models/gemma-3-4b-it.toml | 2 +- providers/llmgateway/models/gemma-3n-e2b-it.toml | 2 +- providers/llmgateway/models/gemma-3n-e4b-it.toml | 2 +- providers/llmgateway/models/gpt-oss-120b.toml | 2 +- providers/llmgateway/models/gpt-oss-20b.toml | 2 +- 9 files changed, 9 insertions(+), 9 deletions(-) diff --git a/providers/llmgateway/models/gemma-2-27b-it-together.toml b/providers/llmgateway/models/gemma-2-27b-it-together.toml index 5c6949729..f865b39dc 100644 --- a/providers/llmgateway/models/gemma-2-27b-it-together.toml +++ b/providers/llmgateway/models/gemma-2-27b-it-together.toml @@ -1,5 +1,5 @@ name = "Gemma 2 27B IT" -family = "gemini" +family = "gemma" release_date = "2024-06-27" last_updated = "2024-06-27" attachment = false diff --git a/providers/llmgateway/models/gemma-3-12b-it.toml b/providers/llmgateway/models/gemma-3-12b-it.toml index f79774a62..4f6aa660b 100644 --- a/providers/llmgateway/models/gemma-3-12b-it.toml +++ b/providers/llmgateway/models/gemma-3-12b-it.toml @@ -1,5 +1,5 @@ 
name = "Gemma 3 12B IT" -family = "gemini" +family = "gemma" release_date = "2025-03-10" last_updated = "2025-03-10" attachment = false diff --git a/providers/llmgateway/models/gemma-3-1b-it.toml b/providers/llmgateway/models/gemma-3-1b-it.toml index 94edf0326..19da323e9 100644 --- a/providers/llmgateway/models/gemma-3-1b-it.toml +++ b/providers/llmgateway/models/gemma-3-1b-it.toml @@ -1,5 +1,5 @@ name = "Gemma 3 1B IT" -family = "gemini" +family = "gemma" release_date = "2025-03-12" last_updated = "2025-03-12" attachment = false diff --git a/providers/llmgateway/models/gemma-3-27b.toml b/providers/llmgateway/models/gemma-3-27b.toml index dd9a9f441..a8bde1194 100644 --- a/providers/llmgateway/models/gemma-3-27b.toml +++ b/providers/llmgateway/models/gemma-3-27b.toml @@ -1,5 +1,5 @@ name = "Gemma 3 27B" -family = "gemini" +family = "gemma" release_date = "2025-03-12" last_updated = "2025-03-12" attachment = true diff --git a/providers/llmgateway/models/gemma-3-4b-it.toml b/providers/llmgateway/models/gemma-3-4b-it.toml index adfabe1db..967753f87 100644 --- a/providers/llmgateway/models/gemma-3-4b-it.toml +++ b/providers/llmgateway/models/gemma-3-4b-it.toml @@ -1,5 +1,5 @@ name = "Gemma 3 4B IT" -family = "gemini" +family = "gemma" release_date = "2025-03-10" last_updated = "2025-03-10" attachment = false diff --git a/providers/llmgateway/models/gemma-3n-e2b-it.toml b/providers/llmgateway/models/gemma-3n-e2b-it.toml index 14ba44048..41414c09b 100644 --- a/providers/llmgateway/models/gemma-3n-e2b-it.toml +++ b/providers/llmgateway/models/gemma-3n-e2b-it.toml @@ -1,5 +1,5 @@ name = "Gemma 3n E2B IT" -family = "gemini" +family = "gemma" release_date = "2025-06-26" last_updated = "2025-06-26" attachment = false diff --git a/providers/llmgateway/models/gemma-3n-e4b-it.toml b/providers/llmgateway/models/gemma-3n-e4b-it.toml index add3fd781..7512c1bb0 100644 --- a/providers/llmgateway/models/gemma-3n-e4b-it.toml +++ b/providers/llmgateway/models/gemma-3n-e4b-it.toml @@ -1,5 
+1,5 @@ name = "Gemma 3n E4B IT" -family = "gemini" +family = "gemma" release_date = "2025-06-26" last_updated = "2025-06-26" attachment = false diff --git a/providers/llmgateway/models/gpt-oss-120b.toml b/providers/llmgateway/models/gpt-oss-120b.toml index 422a24553..708a32e86 100644 --- a/providers/llmgateway/models/gpt-oss-120b.toml +++ b/providers/llmgateway/models/gpt-oss-120b.toml @@ -1,5 +1,5 @@ name = "GPT OSS 120B" -family = "gpt" +family = "gpt-oss" release_date = "2025-08-05" last_updated = "2025-08-05" attachment = false diff --git a/providers/llmgateway/models/gpt-oss-20b.toml b/providers/llmgateway/models/gpt-oss-20b.toml index ee5983c6e..f095e5e02 100644 --- a/providers/llmgateway/models/gpt-oss-20b.toml +++ b/providers/llmgateway/models/gpt-oss-20b.toml @@ -1,5 +1,5 @@ name = "GPT OSS 20B" -family = "gpt" +family = "gpt-oss" release_date = "2025-08-05" last_updated = "2025-08-05" attachment = false